Commit 444f5993 authored by Taylor Robie
Browse files

add unbuffer to run.sh as tee is causing issues

parent 4cdea1cc
#!/bin/bash #!/bin/bash
set -e set -e
if ! which unbuffer > /dev/null; then
echo "Could not find unbuffer command. Make sure the expect package is installed."
exit 1
fi
if [ `id -u` != 0 ]; then if [ `id -u` != 0 ]; then
echo "Calling sudo to gain root for this shell. (Needed to clear caches.)" echo "Calling sudo to gain root for this shell. (Needed to clear caches.)"
sudo echo "Success" sudo echo "Success"
...@@ -55,21 +60,22 @@ do ...@@ -55,21 +60,22 @@ do
# To reduce variation set the seed flag: # To reduce variation set the seed flag:
# --seed ${i} # --seed ${i}
python ncf_main.py --model_dir ${MODEL_DIR} \ unbuffer python ncf_main.py \
--data_dir ${DATA_DIR} \ --model_dir ${MODEL_DIR} \
--dataset ${DATASET} --hooks "" \ --data_dir ${DATA_DIR} \
${DEVICE_FLAG} \ --dataset ${DATASET} --hooks "" \
--clean \ ${DEVICE_FLAG} \
--train_epochs 14 \ --clean \
--batch_size 98304 \ --train_epochs 14 \
--eval_batch_size 160000 \ --batch_size 98304 \
--learning_rate 0.00382059 \ --eval_batch_size 160000 \
--beta1 0.783529 \ --learning_rate 0.00382059 \
--beta2 0.909003 \ --beta1 0.783529 \
--epsilon 1.45439e-07 \ --beta2 0.909003 \
--layers 256,256,128,64 --num_factors 64 \ --epsilon 1.45439e-07 \
--hr_threshold 0.635 \ --layers 256,256,128,64 --num_factors 64 \
--ml_perf \ --hr_threshold 0.635 \
--ml_perf \
|& tee ${RUN_LOG} \ |& tee ${RUN_LOG} \
| grep --line-buffered -E --regexp="(Iteration [0-9]+: HR = [0-9\.]+, NDCG = [0-9\.]+, Loss = [0-9\.]+)|(pipeline_hash)|(MLPerf time:)" | grep --line-buffered -E --regexp="(Iteration [0-9]+: HR = [0-9\.]+, NDCG = [0-9\.]+, Loss = [0-9\.]+)|(pipeline_hash)|(MLPerf time:)"
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment