forked from trpc-group/trpc-agent-python
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathtrain.evalset.json
More file actions
112 lines (112 loc) · 3.19 KB
/
Copy pathtrain.evalset.json
File metadata and controls
112 lines (112 loc) · 3.19 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
{
"eval_set_id": "math_word_problems_train",
"name": "小学算术应用题 - 训练集",
"description": "5 道小学水平算术应用题,覆盖加法、乘法、折扣、百分比与「人/名」类单位;final_response 中带「答案:xxx」的标准答句供 contains 匹配,同时作为 LLM 裁判的参考答案。",
"eval_cases": [
{
"eval_id": "wp_apples_add",
"conversation": [
{
"invocation_id": "t1",
"user_content": {
"parts": [{"text": "小明早上买了 4 个苹果,下午又买了 7 个苹果,他一共有多少个苹果?"}],
"role": "user"
},
"final_response": {
"parts": [{"text": "答案:11 个"}],
"role": "model"
}
}
],
"session_input": {
"app_name": "math_word_problem_optimizer",
"user_id": "trainer",
"state": {}
}
},
{
"eval_id": "wp_car_distance",
"conversation": [
{
"invocation_id": "t2",
"user_content": {
"parts": [{"text": "一辆汽车以每小时 60 公里的速度行驶 2.5 小时,一共行驶了多少公里?"}],
"role": "user"
},
"final_response": {
"parts": [{"text": "答案:150 公里"}],
"role": "model"
}
}
],
"session_input": {
"app_name": "math_word_problem_optimizer",
"user_id": "trainer",
"state": {}
}
},
{
"eval_id": "wp_discount_price",
"conversation": [
{
"invocation_id": "t3",
"user_content": {
"parts": [{"text": "一件衣服原价 200 元,现在打 8 折出售,折后价是多少元?"}],
"role": "user"
},
"final_response": {
"parts": [{"text": "答案:160 元"}],
"role": "model"
}
}
],
"session_input": {
"app_name": "math_word_problem_optimizer",
"user_id": "trainer",
"state": {}
}
},
{
"eval_id": "wp_glasses_percent",
"conversation": [
{
"invocation_id": "t4",
"user_content": {
"parts": [{"text": "班里一共有 40 名学生,其中 25% 戴眼镜,戴眼镜的有多少人?"}],
"role": "user"
},
"final_response": {
"parts": [{"text": "答案:10 人"}],
"role": "model"
}
}
],
"session_input": {
"app_name": "math_word_problem_optimizer",
"user_id": "trainer",
"state": {}
}
},
{
"eval_id": "wp_defect_items_percent",
"conversation": [
{
"invocation_id": "t5",
"user_content": {
"parts": [{"text": "一批商品共 50 件,其中 30% 是次品,次品有多少件?"}],
"role": "user"
},
"final_response": {
"parts": [{"text": "答案:15 件"}],
"role": "model"
}
}
],
"session_input": {
"app_name": "math_word_problem_optimizer",
"user_id": "trainer",
"state": {}
}
}
]
}