# Launch main.py through the apex.parallel.multiproc module.
#
# CUDA_VISIBLE_DEVICES is set to "0,1" and exported first, so the Python
# process (and anything it spawns) inherits it. Any value already present
# in the caller's environment is overwritten.
# NOTE(review): multiproc presumably starts one worker per visible GPU --
# confirm against the installed Apex version.
CUDA_VISIBLE_DEVICES=0,1
export CUDA_VISIBLE_DEVICES

python -m apex.parallel.multiproc main.py