{
  "language": "cn",
  "category": {
    "brainstorming": {
      "GPT": [
        "language organization",
        "relevance",
        "creativity",
        "practicality",
        "reasonableness"
      ],
      "Metrics": [
        "Distinct"
      ]
    },
    "chat": {
      "GPT": [
        "language organization",
        "relevance",
        "naturalness",
        "engagingness",
        "reasonableness"
      ],
      "Metrics": [
        "Distinct"
      ]
    },
    "classification": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "Precision",
        "Recall",
        "F1 score",
        "CHRF"
      ]
    },
    "closed_qa": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "BLEU",
        "ROUGE",
        "BERTScore",
        "CHRF"
      ]
    },
    "extraction": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "Precision",
        "Recall",
        "F1 score",
        "CHRF"
      ]
    },
    "generation": {
      "GPT": [
        "language organization",
        "relevance",
        "diversity"
      ],
      "Metrics": [
        "BLEU",
        "ROUGE",
        "BERTScore"
      ]
    },
    "open_qa": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "Distinct"
      ]
    },
    "rewriting": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness"
      ],
      "Metrics": [
        "BLEU",
        "ROUGE",
        "BERTScore"
      ]
    },
    "roleplay": {
      "GPT": [
        "language organization",
        "relevance",
        "fidelity",
        "creativity"
      ],
      "Metrics": [
        "Distinct"
      ]
    },
    "summarization": {
      "GPT": [
        "language organization",
        "relevance",
        "correctness",
        "conciseness"
      ],
      "Metrics": [
        "BLEU",
        "ROUGE",
        "BERTScore",
        "CHRF"
      ]
    }
  }
}