# Run evaluate.py on two sets of model answers.
#
# The quoted values below are placeholders; replace each with a real path or
# value before running. --answer_file_list receives two separate arguments,
# one per answer file.
#
# Each option sits on its own continued line, with whitespace between the flag
# and its value, so the shell passes them to evaluate.py as distinct arguments.
# The final line deliberately has no trailing backslash, so nothing that
# follows this command is absorbed into it.
#
# NOTE(review): the key is passed on the command line, where it may be visible
# in shell history and process listings. Confirm whether evaluate.py can read
# it from the environment instead.
python evaluate.py \
  --answer_file_list "path to answers of model 1" "path to answers of model 2" \
  --prompt_file "path to prompt file" \
  --reviewer_file "path to reviewer file" \
  --output_folder "path to output folder" \
  --openai_key "your openai key" \
  --model "gpt-4" \
  --num_workers 8 \
  --max_tokens 512