mirror of https://github.com/hpcaitech/ColossalAI
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
205 lines
3.2 KiB
205 lines
3.2 KiB
{
|
|
"language": "cn",
|
|
"category": {
|
|
"brainstorming": {
|
|
"GPT": [
|
|
"language organization",
|
|
"relevance",
|
|
"creativity",
|
|
"practicality",
|
|
"reasonableness"
|
|
],
|
|
"Metrics": [
|
|
"Distinct"
|
|
]
|
|
},
|
|
"chat": {
|
|
"GPT": [
|
|
"language organization",
|
|
"naturalness",
|
|
"engagingness",
|
|
"fidelity"
|
|
],
|
|
"Metrics": [
|
|
"Distinct"
|
|
]
|
|
},
|
|
"classification": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
"Precision",
|
|
"Recall",
|
|
"F1 score",
|
|
"CHRF"
|
|
]
|
|
},
|
|
"closed_qa": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
"BLEU",
|
|
"ROUGE",
|
|
"BERTScore",
|
|
"CHRF"
|
|
]
|
|
},
|
|
"extraction": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
"Precision",
|
|
"Recall",
|
|
"F1 score",
|
|
"CHRF"
|
|
]
|
|
},
|
|
"generation": {
|
|
"GPT": [
|
|
"language organization",
|
|
"relevance",
|
|
"diversity"
|
|
],
|
|
"Metrics": [
|
|
"BLEU",
|
|
"ROUGE",
|
|
"BERTScore"
|
|
]
|
|
},
|
|
"logical_reasoning": {
|
|
"GPT": [
|
|
"correctness",
|
|
"relevance",
|
|
"reasonableness"
|
|
],
|
|
"Metrics": [
|
|
"BLEU",
|
|
"ROUGE",
|
|
"BERTScore",
|
|
"CHRF"
|
|
]
|
|
},
|
|
"open_qa": {
|
|
"GPT": [
|
|
"language organization",
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
"Distinct"
|
|
]
|
|
},
|
|
"rewriting": {
|
|
"GPT": [
|
|
"language organization",
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
"BLEU",
|
|
"ROUGE",
|
|
"BERTScore"
|
|
]
|
|
},
|
|
"roleplay": {
|
|
"GPT": [
|
|
"language organization",
|
|
"relevance",
|
|
"fidelity",
|
|
"creativity"
|
|
],
|
|
"Metrics": [
|
|
"Distinct"
|
|
]
|
|
},
|
|
"summarization": {
|
|
"GPT": [
|
|
"language organization",
|
|
"relevance",
|
|
"correctness",
|
|
"conciseness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"Finance": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"Law": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"Education": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"Medical": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"STEM": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"SocialScience": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"Humanity": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"Other": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
},
|
|
"ethics": {
|
|
"GPT": [
|
|
"relevance",
|
|
"correctness"
|
|
],
|
|
"Metrics": [
|
|
]
|
|
}
|
|
}
|
|
}
|