GPU训练时报错：paddle_trainer 启动初始化 GPU 时触发 "stack smashing detected"（SIGABRT）
Created by: sarawon
root@gputest:~/demo/mnist# sh train.sh
Using debug command gdb --args
GNU gdb (Ubuntu 7.7.1-0ubuntu5~14.04.2) 7.7.1
Copyright (C) 2014 Free Software Foundation, Inc.
License GPLv3+: GNU GPL version 3 or later <http://gnu.org/licenses/gpl.html>
This is free software: you are free to change and redistribute it.
There is NO WARRANTY, to the extent permitted by law. Type "show copying"
and "show warranty" for details.
This GDB was configured as "x86_64-linux-gnu".
Type "show configuration" for configuration details.
For bug reporting instructions, please see:
<http://www.gnu.org/software/gdb/bugs/>.
Find the GDB manual and other documentation resources online at:
<http://www.gnu.org/software/gdb/documentation/>.
For help, type "help".
Type "apropos word" to search for commands related to "word"...
Reading symbols from /usr/bin/../opt/paddle/bin/paddle_trainer...done.
(gdb) r
Starting program: /usr/opt/paddle/bin/paddle_trainer --config=vgg_16_mnist.py --dot_period=10 --log_period=100 --test_all_data_in_one_period=1 --use_gpu=1 --trainer_count=4 --num_passes=10 --save_dir=./mnist_vgg_model
[Thread debugging using libthread_db enabled]
Using host libthread_db library "/lib/x86_64-linux-gnu/libthread_db.so.1".
I0221 18:48:34.436648 29562 Util.cpp:155] commandline: /usr/opt/paddle/bin/paddle_trainer --config=vgg_16_mnist.py --dot_period=10 --log_period=100 --test_all_data_in_one_period=1 --use_gpu=1 --trainer_count=4 --num_passes=10 --save_dir=./mnist_vgg_model
[New Thread 0x7ffff3686700 (LWP 29567)]
[New Thread 0x7ffff2e85700 (LWP 29568)]
*** stack smashing detected ***: /usr/opt/paddle/bin/paddle_trainer terminated
Program received signal SIGABRT, Aborted.
0x00007ffff5cd0c37 in __GI_raise (sig=sig@entry=6) at ../nptl/sysdeps/unix/sysv/linux/raise.c:56
56 ../nptl/sysdeps/unix/sysv/linux/raise.c: No such file or directory.
(gdb) bt
#0 0x00007ffff5cd0c37 in __GI_raise (sig=sig@entry=6) at ../nptl/sysdeps/unix/sysv/linux/raise.c:56
#1 0x00007ffff5cd4028 in __GI_abort () at abort.c:89
#2 0x00007ffff5d0d2a4 in __libc_message (do_abort=do_abort@entry=1, fmt=fmt@entry=0x7ffff5e19113 "*** %s ***: %s terminated\n")
at ../sysdeps/posix/libc_fatal.c:175
#3 0x00007ffff5da4bbc in __GI___fortify_fail (msg=<optimized out>, msg@entry=0x7ffff5e190fb "stack smashing detected") at fortify_fail.c:38
#4 0x00007ffff5da4b60 in __stack_chk_fail () at stack_chk_fail.c:28
#5 0x00000000008954ce in hl_create_global_resources (device_prop=<optimized out>) at /root/paddle/paddle/cuda/src/hl_cuda_device.cc:499
#6 0x00000000008959f9 in hl_specify_devices_start (device=device@entry=0x0, number=18345040, number@entry=0)
at /root/paddle/paddle/cuda/src/hl_cuda_device.cc:593
#7 0x0000000000895d2d in hl_start () at /root/paddle/paddle/cuda/src/hl_cuda_device.cc:430
#8 0x0000000000818602 in paddle::initMain (argc=1, argc@entry=9, argv=argv@entry=0x7fffffffe528) at /root/paddle/paddle/utils/Util.cpp:179
#9 0x000000000052ac5b in main (argc=9, argv=0x7fffffffe528) at /root/paddle/paddle/trainer/TrainerMain.cpp:41