provider.py 880 字节
Newer Older
D
dangqingqing 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
import io,os
import random
import numpy as np
from paddle.trainer.PyDataProvider2 import *

def initHook(settings, height, width, color, num_class, **kwargs):
    settings.height = height 
    settings.width = width 
    settings.color = color 
    settings.num_class = num_class 
    if settings.color:
        settings.data_size = settings.height * settings.width * 3
    else:
        settings.data_size = settings.height * settings.width

    settings.slots = [dense_vector(settings.data_size), integer_value(1)]

@provider(init_hook=initHook, min_pool_size=-1, cache=CacheType.CACHE_PASS_IN_MEM)
def process(settings, file_list):
    with open(file_list, 'r') as fdata:
        for line in fdata:
            img = np.random.rand(1, settings.data_size).reshape(-1, 1).flatten()
            lab = random.randint(0, settings.num_class)
            yield img.tolist(), int(lab)