2023-05-24 03:18:23 +00:00
|
|
|
{
|
|
|
|
"language": "cn",
|
|
|
|
"category": {
|
|
|
|
"brainstorming": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"creativity",
|
|
|
|
"practicality",
|
|
|
|
"correctness"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"Distinct"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"chat": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"naturalness",
|
|
|
|
"engagingness",
|
|
|
|
"reasonableness"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"Distinct"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"classification": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"correctness"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"Precision",
|
|
|
|
"Recall",
|
|
|
|
"F1 score"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"closed_qa": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"correctness"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"BLEU",
|
|
|
|
"ROUGE",
|
|
|
|
"BERTScore"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"extraction": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"correctness"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"Precision",
|
|
|
|
"Recall",
|
|
|
|
"F1 score"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"generation": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"diversity"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"BLEU",
|
|
|
|
"ROUGE",
|
|
|
|
"BERTScore"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"open_qa": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"correctness"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"Distinct"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"rewriting": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"correctness"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"BLEU",
|
|
|
|
"ROUGE",
|
|
|
|
"BERTScore"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"roleplay": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"fidelity",
|
|
|
|
"creativity"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"Distinct"
|
|
|
|
]
|
|
|
|
},
|
|
|
|
"summarization": {
|
2023-05-30 03:48:41 +00:00
|
|
|
"GPT": [
|
2023-05-24 03:18:23 +00:00
|
|
|
"language organization",
|
|
|
|
"relevance",
|
|
|
|
"correctness",
|
|
|
|
"conciseness"
|
|
|
|
],
|
|
|
|
"Metrics": [
|
|
|
|
"BLEU",
|
|
|
|
"ROUGE",
|
|
|
|
"BERTScore"
|
|
|
|
]
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|