"applications/Chat/examples/ray/mmmt_prompt.py" did not exist on "41fb7236aa32c307e83b0b9cc50ce2a6da279343"
format_questions.py 988 Bytes
Newer Older
Yuanchen's avatar
Yuanchen committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
import argparse
import os
import json
import copy

from utils import jdump, get_json_list


def format_questions(args):
    """Convert raw question records into instruction-style records and save them.

    Records are loaded with ``get_json_list(args.questions_path)`` and each
    one is mapped to a new dict containing exactly these fields:

    * ``category``    - copied from the record, only when the record has it
    * ``instruction`` - the record's ``text``
    * ``input``       - always the empty string
    * ``output``      - always the empty string
    * ``id``          - the record's ``question_id``

    The resulting list is handed to ``jdump`` together with ``args.save_path``.

    Args:
        args: Object exposing ``questions_path`` and ``save_path`` attributes
            (the argparse namespace built by this script).

    Raises:
        KeyError: If a record has no ``text`` or no ``question_id`` entry.
    """
    questions = get_json_list(args.questions_path)

    formatted_questions = []
    for question in questions:
        # Build every record from scratch instead of copying the source and
        # deleting the first record's keys: that approach crashed on an empty
        # file, raised KeyError when records had differing keys, and removed
        # the new fields again whenever the source already used their names.
        formatted = {}
        if 'category' in question:
            # Kept first so the key order matches the previous output for
            # records shaped like {question_id, text, category}.
            formatted['category'] = question['category']
        formatted['instruction'] = question['text']
        formatted['input'] = ""
        formatted['output'] = ""
        formatted['id'] = question['question_id']
        formatted_questions.append(formatted)

    jdump(formatted_questions, args.save_path)

if __name__ == '__main__':
    # Script entry point: both options are plain string paths, so register
    # them from a small table and pass the parsed namespace straight on.
    cli = argparse.ArgumentParser()
    for flag, default_path in (
        ('--questions_path', 'table/question.jsonl'),
        ('--save_path', "table/questions.json"),
    ):
        cli.add_argument(flag, type=str, default=default_path)
    format_questions(cli.parse_args())