from paddle.trainer_config_helpers import * from paddle.trainer.PyDataProvider2 import dense_vector, integer_value import paddle.v2 as paddle_v2 import numpy import mnist_util def train_reader(): train_file = './data/raw_data/train' generator = mnist_util.read_from_mnist(train_file) for item in generator: yield item def network_config(): imgs = data_layer(name='pixel', size=784) hidden1 = fc_layer(input=imgs, size=200) hidden2 = fc_layer(input=hidden1, size=200) inference = fc_layer(input=hidden2, size=10, act=SoftmaxActivation()) cost = classification_cost( input=inference, label=data_layer( name='label', size=10)) outputs(cost) def event_handler(event): if isinstance(event, paddle_v2.trainer.CompleteTrainOneBatch): print "Pass %d, Batch %d, Cost %f" % (event.pass_id, event.batch_id, event.cost) else: pass def main(): paddle_v2.init(use_gpu=False, trainer_count=1) model_config = parse_network_config(network_config) pool = paddle_v2.parameters.create(model_config) for param_name in pool.get_names(): array = pool.get_parameter(param_name) array[:] = numpy.random.uniform(low=-1.0, high=1.0, size=array.shape) trainer = paddle_v2.trainer.SGDTrainer( update_equation=paddle_v2.optimizer.Adam( learning_rate=1e-4, model_average=ModelAverage(average_window=0.5), regularization=L2Regularization(rate=0.5))) trainer.train(train_data_reader=train_reader, topology=model_config, parameters=pool, event_handler=event_handler, batch_size=32, # batch size should be refactor in Data reader data_types={ # data_types will be removed, It should be in # network topology 'pixel': dense_vector(784), 'label': integer_value(10) }) if __name__ == '__main__': main()