{
  "language": "cn",
  "category": {
    "brainstorming": {
      "GPT": [
        "language organization",
        "relevance",
        "creativity",
        "practicality",
        "correctness"
      ],
      "Metrics": [
        "Distinct"
      ]
    },
    "chat": {
      "GPT": [
        "language organization",
        "relevance",
        "naturalness",
        "engagingness",
        "reasonableness"
      ],
      "Metrics": [
        "Distinct"
      ]
    },
    "classification": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "Precision",
        "Recall",
        "F1 score"
      ]
    },
    "closed_qa": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "BLEU",
        "ROUGE",
        "BERTScore"
      ]
    },
    "extraction": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "Precision",
        "Recall",
        "F1 score"
      ]
    },
    "generation": {
      "GPT": [
        "language organization",
        "relevance",
        "diversity"
      ],
      "Metrics": [
        "BLEU",
        "ROUGE",
        "BERTScore"
      ]
    },
    "open_qa": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "Distinct"
      ]
    },
    "rewriting": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "BLEU",
        "ROUGE",
        "BERTScore"
      ]
    },
    "roleplay": {
      "GPT": [
        "language organization",
        "relevance",
        "fidelity",
        "creativity"
      ],
      "Metrics": [
        "Distinct"
      ]
    },
    "summarization": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness",
        "conciseness"
      ],
      "Metrics": [
        "BLEU",
        "ROUGE",
        "BERTScore"
      ]
    }
  }
}