diff --git a/cn/index.html b/cn/index.html index ce93718cd98834b40b2109dde246e09569b52a4b..be5171318464e6f8ddcec89b8bb9a82ae83a2622 100644 --- a/cn/index.html +++ b/cn/index.html @@ -90,7 +90,7 @@ var _hmt = _hmt || [];
开放易用的深度学习平台,工业应用与学术研究并举
- 快速上手 + 深度学习入门 文档 代码 diff --git a/develop/doc/.buildinfo b/develop/doc/.buildinfo new file mode 100644 index 0000000000000000000000000000000000000000..fde5b8bfbc436bbc4a03de16618279f8cdd8f28b --- /dev/null +++ b/develop/doc/.buildinfo @@ -0,0 +1,4 @@ +# Sphinx build info version 1 +# This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. +config: 4d7a146cda87e1e0222ce8a24b0ea6b4 +tags: 645f666f9bcd5a90fca523b33c5a78b7 diff --git a/develop/doc/_images/FullyConnected.jpg b/develop/doc/_images/FullyConnected.jpg new file mode 100644 index 0000000000000000000000000000000000000000..b2241f401434e527f95ee4e0e541a3f2ff78fd1e Binary files /dev/null and b/develop/doc/_images/FullyConnected.jpg differ diff --git a/develop/doc/_images/NetContinuous_en.png b/develop/doc/_images/NetContinuous_en.png new file mode 100644 index 0000000000000000000000000000000000000000..7bdef1aa366711806585d35c8653c987fd63d59e Binary files /dev/null and b/develop/doc/_images/NetContinuous_en.png differ diff --git a/develop/doc/_images/NetConv_en.png b/develop/doc/_images/NetConv_en.png new file mode 100644 index 0000000000000000000000000000000000000000..ad618d1d6f8f4839f566f5f5cb5db37a4b7d9093 Binary files /dev/null and b/develop/doc/_images/NetConv_en.png differ diff --git a/develop/doc/_images/NetLR_en.png b/develop/doc/_images/NetLR_en.png new file mode 100644 index 0000000000000000000000000000000000000000..9d514bf1b18a0c330f98c28785e5d008f409fc1d Binary files /dev/null and b/develop/doc/_images/NetLR_en.png differ diff --git a/develop/doc/_images/NetRNN_en.png b/develop/doc/_images/NetRNN_en.png new file mode 100644 index 0000000000000000000000000000000000000000..180f273d32ea59dc8ececa69c08e249f79f9d4f7 Binary files /dev/null and b/develop/doc/_images/NetRNN_en.png differ diff --git a/develop/doc/_images/PipelineNetwork_en.jpg b/develop/doc/_images/PipelineNetwork_en.jpg new file mode 100644 index 
0000000000000000000000000000000000000000..e779aed06d5cdb2b442754e7915e79b72946418e Binary files /dev/null and b/develop/doc/_images/PipelineNetwork_en.jpg differ diff --git a/develop/doc/_images/PipelineTest_en.png b/develop/doc/_images/PipelineTest_en.png new file mode 100644 index 0000000000000000000000000000000000000000..7e7ef520b5effa2f43fd2964048f05c42f2ea890 Binary files /dev/null and b/develop/doc/_images/PipelineTest_en.png differ diff --git a/develop/doc/_images/PipelineTrain_en.png b/develop/doc/_images/PipelineTrain_en.png new file mode 100644 index 0000000000000000000000000000000000000000..132d29bfd5d678d2518161d0b5ed2e16a233a048 Binary files /dev/null and b/develop/doc/_images/PipelineTrain_en.png differ diff --git a/develop/doc/_images/Pipeline_en.jpg b/develop/doc/_images/Pipeline_en.jpg new file mode 100644 index 0000000000000000000000000000000000000000..21a7a7bb6a1af746120e6f4f51f797b6aaafb9d8 Binary files /dev/null and b/develop/doc/_images/Pipeline_en.jpg differ diff --git a/develop/doc/_images/add_security_group.png b/develop/doc/_images/add_security_group.png new file mode 100644 index 0000000000000000000000000000000000000000..bd34f46c9b0ada7027fd53e553e7d033255d25fc Binary files /dev/null and b/develop/doc/_images/add_security_group.png differ diff --git a/develop/doc/_images/bi_lstm.jpg b/develop/doc/_images/bi_lstm.jpg new file mode 100644 index 0000000000000000000000000000000000000000..adec1606d64d6e35ffe7e62abfa9a09309b05c84 Binary files /dev/null and b/develop/doc/_images/bi_lstm.jpg differ diff --git a/develop/doc/_images/bi_lstm1.jpg b/develop/doc/_images/bi_lstm1.jpg new file mode 100644 index 0000000000000000000000000000000000000000..adec1606d64d6e35ffe7e62abfa9a09309b05c84 Binary files /dev/null and b/develop/doc/_images/bi_lstm1.jpg differ diff --git a/develop/doc/_images/cifar.png b/develop/doc/_images/cifar.png new file mode 100644 index 0000000000000000000000000000000000000000..f54a0c58837cb3385b32dc57d02cec92666ef0f1 Binary 
files /dev/null and b/develop/doc/_images/cifar.png differ diff --git a/develop/doc/_images/create_efs.png b/develop/doc/_images/create_efs.png new file mode 100644 index 0000000000000000000000000000000000000000..e5f1526033d1daf401700989af1d25919bcb7675 Binary files /dev/null and b/develop/doc/_images/create_efs.png differ diff --git a/develop/doc/_images/curve.jpg b/develop/doc/_images/curve.jpg new file mode 100644 index 0000000000000000000000000000000000000000..baa35ae7f0a0b6c246f3a0d331735477ab8bcd70 Binary files /dev/null and b/develop/doc/_images/curve.jpg differ diff --git a/develop/doc/_images/encoder-decoder-attention-model.png b/develop/doc/_images/encoder-decoder-attention-model.png new file mode 100644 index 0000000000000000000000000000000000000000..79f911d4ba12ac0c0d1a936c9df639c302786914 Binary files /dev/null and b/develop/doc/_images/encoder-decoder-attention-model.png differ diff --git a/develop/doc/_images/encoder-decoder-attention-model1.png b/develop/doc/_images/encoder-decoder-attention-model1.png new file mode 100644 index 0000000000000000000000000000000000000000..79f911d4ba12ac0c0d1a936c9df639c302786914 Binary files /dev/null and b/develop/doc/_images/encoder-decoder-attention-model1.png differ diff --git a/develop/doc/_images/feature.jpg b/develop/doc/_images/feature.jpg new file mode 100644 index 0000000000000000000000000000000000000000..0e3310e4ace5613917e7779d3198ccbb3cdc5ada Binary files /dev/null and b/develop/doc/_images/feature.jpg differ diff --git a/develop/doc/_images/gan.png b/develop/doc/_images/gan.png new file mode 100644 index 0000000000000000000000000000000000000000..0eafd7cb49b545f412f8e775804bcd0b22c42454 Binary files /dev/null and b/develop/doc/_images/gan.png differ diff --git a/develop/doc/_images/image_classification.png b/develop/doc/_images/image_classification.png new file mode 100644 index 0000000000000000000000000000000000000000..14f255805081c1b4fab27eaf336fd389fa93ca19 Binary files /dev/null and 
b/develop/doc/_images/image_classification.png differ diff --git a/develop/doc/_images/lenet.png b/develop/doc/_images/lenet.png new file mode 100644 index 0000000000000000000000000000000000000000..1e6f2b32bad797f3fccb929c72a121fc935b0cbb Binary files /dev/null and b/develop/doc/_images/lenet.png differ diff --git a/develop/doc/_images/lstm.png b/develop/doc/_images/lstm.png new file mode 100644 index 0000000000000000000000000000000000000000..aaf1fc690da2ffb8418cde5ed81848ddb5263030 Binary files /dev/null and b/develop/doc/_images/lstm.png differ diff --git a/develop/doc/_images/mnist_sample.png b/develop/doc/_images/mnist_sample.png new file mode 100644 index 0000000000000000000000000000000000000000..f9c7bf7ddd7f148eac4fe347e9c38afaa8876760 Binary files /dev/null and b/develop/doc/_images/mnist_sample.png differ diff --git a/develop/doc/_images/network_arch.png b/develop/doc/_images/network_arch.png new file mode 100644 index 0000000000000000000000000000000000000000..4ae7864212f2a0a38102ee7ff600527ea99fec82 Binary files /dev/null and b/develop/doc/_images/network_arch.png differ diff --git a/develop/doc/_images/neural-n-gram-model.png b/develop/doc/_images/neural-n-gram-model.png new file mode 100644 index 0000000000000000000000000000000000000000..f70b765b3fd69816345a79fc59adfea46008dbfd Binary files /dev/null and b/develop/doc/_images/neural-n-gram-model.png differ diff --git a/develop/doc/_images/nvvp1.png b/develop/doc/_images/nvvp1.png new file mode 100644 index 0000000000000000000000000000000000000000..1af23ac3c52929b2b0645d2f9fa4d4c6db1f6e77 Binary files /dev/null and b/develop/doc/_images/nvvp1.png differ diff --git a/develop/doc/_images/nvvp2.png b/develop/doc/_images/nvvp2.png new file mode 100644 index 0000000000000000000000000000000000000000..177c9db708da6863d1075f3e615f5962dbe18b29 Binary files /dev/null and b/develop/doc/_images/nvvp2.png differ diff --git a/develop/doc/_images/nvvp3.png b/develop/doc/_images/nvvp3.png new file mode 100644 index 
0000000000000000000000000000000000000000..d8f393667d6569b6f1e61ffccac43fae5888b6db Binary files /dev/null and b/develop/doc/_images/nvvp3.png differ diff --git a/develop/doc/_images/nvvp4.png b/develop/doc/_images/nvvp4.png new file mode 100644 index 0000000000000000000000000000000000000000..51f2f3e183295de6cf8ddaf2b3b8a0862aa35f01 Binary files /dev/null and b/develop/doc/_images/nvvp4.png differ diff --git a/develop/doc/_images/parameters.png b/develop/doc/_images/parameters.png new file mode 100644 index 0000000000000000000000000000000000000000..2ec67480951e21f0400bce1c34b3108dcd65c18c Binary files /dev/null and b/develop/doc/_images/parameters.png differ diff --git a/develop/doc/_images/plot.png b/develop/doc/_images/plot.png new file mode 100644 index 0000000000000000000000000000000000000000..a31f99791c670e18bb8c62b7604ec8cb0284ffb4 Binary files /dev/null and b/develop/doc/_images/plot.png differ diff --git a/develop/doc/_images/pserver_and_trainer.png b/develop/doc/_images/pserver_and_trainer.png new file mode 100644 index 0000000000000000000000000000000000000000..f41fe48920590333ad332bb51eb18e03dc251541 Binary files /dev/null and b/develop/doc/_images/pserver_and_trainer.png differ diff --git a/develop/doc/_images/rec_regression_network.png b/develop/doc/_images/rec_regression_network.png new file mode 100644 index 0000000000000000000000000000000000000000..7d2b54d4fcf560cd5b667628f0012c3822efd9b2 Binary files /dev/null and b/develop/doc/_images/rec_regression_network.png differ diff --git a/develop/doc/_images/resnet_block.jpg b/develop/doc/_images/resnet_block.jpg new file mode 100644 index 0000000000000000000000000000000000000000..e16bd3c624030c4c09b358a015b491141b42d8f1 Binary files /dev/null and b/develop/doc/_images/resnet_block.jpg differ diff --git a/develop/doc/_images/route53_create_recordset.png b/develop/doc/_images/route53_create_recordset.png new file mode 100644 index 
0000000000000000000000000000000000000000..34e476c7beac30fcdde13fccc4cc8d08b4be3d35 Binary files /dev/null and b/develop/doc/_images/route53_create_recordset.png differ diff --git a/develop/doc/_images/route53_create_zone.png b/develop/doc/_images/route53_create_zone.png new file mode 100644 index 0000000000000000000000000000000000000000..25b7ddb831c5cba97f4b2edddd27da3234d621af Binary files /dev/null and b/develop/doc/_images/route53_create_zone.png differ diff --git a/develop/doc/_images/stacked_lstm.jpg b/develop/doc/_images/stacked_lstm.jpg new file mode 100644 index 0000000000000000000000000000000000000000..4239055050966e0095e188a8c81d860711bce29d Binary files /dev/null and b/develop/doc/_images/stacked_lstm.jpg differ diff --git a/develop/doc/_images/uniform_sample.png b/develop/doc/_images/uniform_sample.png new file mode 100644 index 0000000000000000000000000000000000000000..e716c48e782019a757bed0cb443f2ed97386cbe2 Binary files /dev/null and b/develop/doc/_images/uniform_sample.png differ diff --git a/develop/doc/_images/worker_security_group.png b/develop/doc/_images/worker_security_group.png new file mode 100644 index 0000000000000000000000000000000000000000..57eb0265a34ad4223b69600d2a3dd355482e0bf5 Binary files /dev/null and b/develop/doc/_images/worker_security_group.png differ diff --git a/develop/doc/_sources/about/index_en.rst.txt b/develop/doc/_sources/about/index_en.rst.txt new file mode 100644 index 0000000000000000000000000000000000000000..065c430cdea802ed3c9f487cd00255b85a5598a5 --- /dev/null +++ b/develop/doc/_sources/about/index_en.rst.txt @@ -0,0 +1,14 @@ +ABOUT +======= + +PaddlePaddle is an easy-to-use, efficient, flexible and scalable deep learning platform, +which was originally developed by Baidu scientists and engineers for the purpose of applying deep learning to many products at Baidu. + +PaddlePaddle is now open source but far from complete, which is intended to be built upon, improved, scaled, and extended. 
+We hope to build an active open source community both by providing feedback and by actively contributing to the source code. + + +Credits +-------- + +We owe many thanks to `all contributors and developersOptional | +Description | +
---|---|
WITH_GPU | Compile PaddlePaddle with NVIDIA GPU |
WITH_AVX | Compile PaddlePaddle with AVX intrinsics |
WITH_DSO | Compile PaddlePaddle with dynamic linked CUDA |
WITH_TESTING | Compile PaddlePaddle with unit testing |
WITH_SWIG_PY | Compile PaddlePaddle with inference api |
WITH_STYLE_CHECK | Compile PaddlePaddle with style check |
WITH_PYTHON | Compile PaddlePaddle with python interpreter |
WITH_DOUBLE | Compile PaddlePaddle with double precision |
WITH_RDMA | Compile PaddlePaddle with RDMA support |
WITH_TIMER | Compile PaddlePaddle with stats timer |
WITH_PROFILER | Compile PaddlePaddle with GPU profiler |
WITH_DOC | Compile PaddlePaddle with documentation |
ON_COVERALLS | Compile PaddlePaddle with code coverage |
COVERALLS_UPLOAD | Package code coverage data to coveralls |
ON_TRAVIS | Exclude special unit test on Travis CI |
+ | args | +local train | +cluster train | +local test | +cluster test | +
---|---|---|---|---|---|
common | +job | +√ | √ | √ | √ | +
use_gpu | +√ | √ | √ | √ | +|
local | +√ | √ | √ | √ | +|
config | +√ | √ | √ | √ | +|
config_args | +√ | √ | √ | √ | +|
num_passes | +√ | √ | √ | √ | +|
trainer_count | +√ | √ | √ | √ | +|
version | +√ | √ | √ | √ | +|
show_layer_stat | +√ | √ | √ | √ | +|
train | dot_period | +√ | √ | + | |
test_period | +√ | √ | + | ||
saving_period | +√ | √ | + | ||
show_parameter_stats_period | +√ | √ | + | ||
init_model_path | +√ | √ | √ | + | |
load_missing_parameter_strategy | +√ | √ | + | ||
saving_period_by_batches | +√ | √ | + | ||
use_old_updater | +√ | √ | + | ||
enable_grad_share | +√ | √ | + | ||
grad_share_block_num | +√ | √ | + | ||
log_error_clipping | +√ | √ | + | ||
log_clipping | +√ | √ | + | ||
save_only_one | +√ | √ | + | ||
start_pass | +√ | √ | + | ||
train/test | save_dir | +√ | √ | √ | √ | +
testing during training | test_period | +√ | √ | + | |
average_test_period | +√ | √ | + | ||
test | model_list | +√ | √ | +||
test_wait | +√ | √ | +|||
test_pass | +√ | √ | +|||
predict_output_dir | +√ | √ | +|||
distribute_test | +√ | √ | +|||
Auc/PnpairValidation | predict_file | +√ | √ | +||
GPU | gpu_id | +√ | √ | √ | √ | +
parallel_nn | +√ | √ | √ | √ | +|
allow_only_one_model_on_one_gpu | +√ | √ | √ | √ | +|
cudnn_dir | +√ | √ | √ | √ | +|
cuda_dir | +√ | √ | √ | √ | +|
cudnn_conv_workspace_limit_in_mb | +√ | √ | √ | √ | +|
RNN | +beam_size | +√ | √ | +||
rnn_use_batch | +√ | √ | √ | √ | +|
prev_batch_state | +√ | √ | + | ||
diy_beam_search_prob_so | +√ | √ | +|||
metric learning | external | +√ | √ | √ | √ | +
data_server_port | +√ | √ | +|||
PServer | start_pserver | +√ | √ | +||
pservers | +√ | √ | +|||
port | +√ | √ | +|||
port_num | +√ | √ | +|||
ports_num_for_sparse | +√ | √ | +|||
nics | +√ | √ | +|||
rdma_tcp | +√ | √ | +|||
small_messages | +√ | + | |||
loadsave_parameters_in_pserver | +√ | √ | +|||
log_period_server | +√ | + | |||
pserver_num_threads | +√ | + | |||
sock_send_buf_size | +√ | + | |||
sock_recv_buf_size | +√ | + | |||
num_gradient_servers | +√ | + | |||
parameter_block_size | +√ | + | |||
parameter_block_size_for_sparse | +√ | + | |||
Async SGD | async_count | +√ | + | ||
async_lagged_ratio_min | +√ | + | |||
async_lagged_ratio_default | +√ | + | |||
Performance Tuning | log_barrier_abstract | +√ | + | ||
log_barrier_lowest_nodes | +√ | + | |||
log_barrier_show_log | +√ | + | |||
check_sparse_distribution_batches | +√ | + | |||
check_sparse_distribution_ratio | +√ | + | |||
check_sparse_distribution_unbalance_degree | +√ | + | |||
check_sparse_distribution_in_pserver | +√ | + | |||
show_check_sparse_distribution_log | +√ | + | |||
Data Provider | memory_threshold_on_load_data | +√ | √ | + | |
RandomNumber | seed | +√ | √ | + | |
thread_local_rand_use_global_seed | +√ | √ | + | ||
UnitTest | checkgrad_eps | ++ | |||
Matrix/Vector | enable_parallel_vector | +√ | √ | √ | √ | +
+ Figure 1. GAN-Model-Structure + figure credit +
+ +The generator and discriminator take turns being trained using SGD. The objective function of the generator is for its generated images to be classified as real by the discriminator, and the objective function of the discriminator is to correctly classify real and fake images. When the GAN model is trained to converge to the equilibrium state, the generator will transform the given noise distribution to the distribution of real images, and the discriminator will not be able to distinguish between real and fake images at all. + +## Implementation of GAN Model Structure +Since the GAN model involves multiple neural networks, it requires the use of the Paddle Python API. So the code walk-through below can also partially serve as an introduction to the usage of the Paddle Python API. + +There are three networks defined in gan_conf.py, namely **generator_training**, **discriminator_training** and **generator**. The relationship to the model structure we defined above is that **discriminator_training** is the discriminator, **generator** is the generator, and **generator_training** combines the generator and discriminator, since training the generator requires the discriminator to provide the loss function. 
This relationship is described in the following code: +```python +if is_generator_training: + noise = data_layer(name="noise", size=noise_dim) + sample = generator(noise) + +if is_discriminator_training: + sample = data_layer(name="sample", size=sample_dim) + +if is_generator_training or is_discriminator_training: + label = data_layer(name="label", size=1) + prob = discriminator(sample) + cost = cross_entropy(input=prob, label=label) + classification_error_evaluator( + input=prob, label=label, name=mode + '_error') + outputs(cost) + +if is_generator: + noise = data_layer(name="noise", size=noise_dim) + outputs(generator(noise)) +``` + +In order to train the networks defined in gan_conf.py, one first needs to initialize a Paddle environment, parse the config, create GradientMachine from the config and create trainer from GradientMachine as done in the code chunk below: +```python +import py_paddle.swig_paddle as api +# init paddle environment +api.initPaddle('--use_gpu=' + use_gpu, '--dot_period=10', + '--log_period=100', '--gpu_id=' + args.gpu_id, + '--save_dir=' + "./%s_params/" % data_source) + +# Parse config +gen_conf = parse_config(conf, "mode=generator_training,data=" + data_source) +dis_conf = parse_config(conf, "mode=discriminator_training,data=" + data_source) +generator_conf = parse_config(conf, "mode=generator,data=" + data_source) + +# Create GradientMachine +dis_training_machine = api.GradientMachine.createFromConfigProto( +dis_conf.model_config) +gen_training_machine = api.GradientMachine.createFromConfigProto( +gen_conf.model_config) +generator_machine = api.GradientMachine.createFromConfigProto( +generator_conf.model_config) + +# Create trainer +dis_trainer = api.Trainer.create(dis_conf, dis_training_machine) +gen_trainer = api.Trainer.create(gen_conf, gen_training_machine) +``` + +In order to balance the strength between generator and discriminator, we schedule to train whichever one is performing worse by comparing their loss function value. 
The loss function value can be calculated by a forward pass through the GradientMachine. +```python +def get_training_loss(training_machine, inputs): + outputs = api.Arguments.createArguments(0) + training_machine.forward(inputs, outputs, api.PASS_TEST) + loss = outputs.getSlotValue(0).copyToNumpyMat() + return numpy.mean(loss) +``` + +After training one network, one needs to sync the new parameters to the other networks. The code below demonstrates one example of such use case: +```python +# Train the gen_training +gen_trainer.trainOneDataBatch(batch_size, data_batch_gen) + +# Copy the parameters from gen_training to dis_training and generator +copy_shared_parameters(gen_training_machine, +dis_training_machine) +copy_shared_parameters(gen_training_machine, generator_machine) +``` + + +## A Toy Example +With the infrastructure explained above, we can now walk you through a toy example of generating two dimensional uniform distribution using 10 dimensional Gaussian noise. + +The Gaussian noises are generated using the code below: +```python +def get_noise(batch_size, noise_dim): + return numpy.random.normal(size=(batch_size, noise_dim)).astype('float32') +``` + +The real samples (2-D uniform) are generated using the code below: +```python +# synthesize 2-D uniform data in gan_trainer.py:114 +def load_uniform_data(): + data = numpy.random.rand(1000000, 2).astype('float32') + return data +``` + +The generator and discriminator network are built using fully-connected layer and batch_norm layer, and are defined in gan_conf.py. + +To train the GAN model, one can use the command below. The flag -d specifies the training data (cifar, mnist or uniform) and flag --useGpu specifies whether to use gpu for training (0 is cpu, 1 is gpu). +```bash +$python gan_trainer.py -d uniform --useGpu 1 +``` +The generated samples can be found in ./uniform_samples/ and one example is shown below as Figure 2. One can see that it roughly recovers the 2D uniform distribution. + ++ Figure 2. 
Uniform Sample +
+ +## MNIST Example +### Data preparation +To download the MNIST data, one can use the following commands: +```bash +$cd data/ +$./get_mnist_data.sh +``` + +### Model description +Following the DC-Gan paper (https://arxiv.org/abs/1511.06434), we use convolution/convolution-transpose layer in the discriminator/generator network to better deal with images. The details of the network structures are defined in gan_conf_image.py. + +### Training the model +To train the GAN model on mnist data, one can use the following command: +```bash +$python gan_trainer.py -d mnist --useGpu 1 +``` +The generated sample images can be found at ./mnist_samples/ and one example is shown below as Figure 3. ++ Figure 3. MNIST Sample +
diff --git a/develop/doc/_sources/tutorials/image_classification/index_en.md.txt b/develop/doc/_sources/tutorials/image_classification/index_en.md.txt new file mode 100644 index 0000000000000000000000000000000000000000..60c81a6a539944634773f38ec4c9a59709dd4afc --- /dev/null +++ b/develop/doc/_sources/tutorials/image_classification/index_en.md.txt @@ -0,0 +1,221 @@ +Image Classification Tutorial +============================== + +This tutorial will guide you through training a convolutional neural network to classify objects using the CIFAR-10 image classification dataset. +As shown in the following figure, the convolutional neural network can recognize the main object in images, and output the classification result. + +ResNet | +Top-1 | +Model Size | +
---|---|---|
ResNet-50 | +24.9% | +99M | +
ResNet-101 | +23.7% | +173M | +
ResNet-152 | +23.2% | +234M | +
Parameter Name | +Number | +Meaning | +
---|---|---|
_res2_1_branch1_bn.w0 | +256 | +gamma, scale parameter | +
_res2_1_branch1_bn.w1 | +256 | +mean value of feature map | +
_res2_1_branch1_bn.w2 | +256 | +variance of feature map | +
_res2_1_branch1_bn.wbias | +256 | +beta, shift parameter | +
Network name | +Number of parameters | +Test error | + + + + +
---|---|---|
Logistic regression | +252 KB | +8.652% | +
Network name | +Number of parameters | +Test error | + + + + +
---|---|---|
Word embedding model | +15 MB | +8.484% | +
Network name | +Number of parameters | +Test error | + + + + +
---|---|---|
Convolutional model | +16 MB | +5.628% | +
Network name | +Number of parameters | +Test error | + + + + +
---|---|---|
Recurrent model | +16 MB | +4.812% | +
Network name | +Number of parameters | +Error rate | +Configuration file name | + + + + +
---|---|---|---|
Logistic regression model(BOW) | +252KB | +8.652% | +trainer_config.lr.py | +
Word embedding | +15MB | +8.484% | +trainer_config.emb.py | +
Convolution model | +16MB | +5.628% | +trainer_config.cnn.py | +
Time sequence model | +16MB | +4.812% | +trainer_config.lstm.py | +
Name | +Explanation | + + + +
---|---|
Batch=20 | +You have trained 20 batches. | +
samples=2560 | +You have trained 2560 examples. | +
AvgCost | +The average cost from the first batch to the current batch. | +
CurrentCost | +The average cost of the last log_period batches. | +
Eval: classification_error_evaluator | +The average classification error from the first batch to the current batch. | +
CurrentEval: classification_error_evaluator | +The average error rate of the last log_period batches | +
folder name | +French-English parallel corpora files | +total number of files | +size | +
---|---|---|---|
train_data | +ccb2_pc30.src, ccb2_pc30.trg, etc | +twelve | +3.55G | +
test_data | +ntst1213.src, ntst1213.trg | +two | +1636k | +
gen_data | +ntst14.src, ntst14.trg | +two | +864k | +