"docs/vscode:/vscode.git/clone" did not exist on "88a6f9dab5cc67b71d85a93a9d3f924879e33aa8"
make_paired_data.sh 370 Bytes
Newer Older
yangzhong's avatar
yangzhong committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
#!/bin/bash
#
# Launch make_paired_data.py through torchrun as a single process on one node.
#
# Usage:
#   INPUT_CSV=/path/to/input.csv SAVE_PATH=/path/to/output ./make_paired_data.sh
#
# INPUT_CSV and SAVE_PATH may be supplied through the environment or filled in
# below. The script refuses to start while either one is empty.

# Abort on command failure, on use of an unset variable, and on a failure
# anywhere inside a pipeline.
set -euo pipefail

# Define environment variables
# Only CUDA device index 0 is made visible to the launched process.
export CUDA_VISIBLE_DEVICES="0"
# NOTE(review): presumably read by the Hugging Face tokenizers library to turn
# off its internal parallelism -- confirm against make_paired_data.py.
export TOKENIZERS_PARALLELISM=false

# Define paths
# Values already present in the environment are kept; otherwise replace the
# empty defaults here.
INPUT_CSV="${INPUT_CSV:-}"
SAVE_PATH="${SAVE_PATH:-}"

# Fail early with a clear message instead of handing torchrun an argument list
# in which an option is missing its value.
: "${INPUT_CSV:?INPUT_CSV is empty; set it to the input CSV path}"
: "${SAVE_PATH:?SAVE_PATH is empty; set it to the output path}"

# Run script on the full CSV file
# Both paths are quoted so that spaces or glob characters in them reach the
# Python script as a single, unmodified argument.
torchrun --nnodes=1 --nproc_per_node=1 --master_port=29501 \
    make_paired_data.py \
    --config "./make_data_config.py" \
    --data-path "$INPUT_CSV" \
    --save_path "$SAVE_PATH"