@@ -2140,4 +2140,56 @@ evaluator_template_conf_en-US:
2140
2140
prompt_source_type : 1
2141
2141
prompt_template_key : builtin_template_detail
2142
2142
prompt_template_name : " Detail"
2143
+ receive_chat_history : false
2144
+
2145
+ code_evaluator_template_conf :
2146
+ equals_checker :
2147
+ Python :
2148
+ receive_chat_history : false
2149
+ # Equality template (Python): exec_evaluation returns score 1.0 when the stripped actual and reference texts are equal, otherwise 0.0.
+ # language_type and code_template_key must match the `Python` and `equals_checker` mapping keys exactly (no padding inside the quotes).
+ code_evaluator :
2150
+ language_type : "Python"
2151
+ code_content : "def exec_evaluation(turn_data):\n    try:\n        # 获取实际输出和参考输出\n        actual_text = turn_data[\"turn\"][\"eval_target\"][\"actual_output\"][\"text\"]\n        reference_text = turn_data[\"turn\"][\"eval_set\"][\"reference_output\"][\"text\"]\n\n        # 比较文本相似性或相等性\n        is_equal = actual_text.strip() == reference_text.strip()\n        score = 1.0 if is_equal else 0.0\n\n        if is_equal:\n            status = \"匹配\"\n        else:\n            status = \"不匹配\"\n        reason = f\"实际输出与参考输出{status}。实际输出: '{actual_text}', 参考输出: '{reference_text}'\"\n\n        return EvalOutput(score=score, reason=reason, err_msg=\"\")\n\n    except KeyError as e:\n        return EvalOutput(score=0.0, reason=f\"字段路径未找到: {e}\", err_msg=str(e))\n    except Exception as e:\n        return EvalOutput(score=0.0, reason=f\"评估失败: {e}\", err_msg=str(e))"
2152
+ code_template_key : "equals_checker"
2153
+ code_template_name : "相等性检查器"
2154
+ Python3 :
2155
+ receive_chat_history : false
2156
+ # Equality template (Python3): exec_evaluation returns score 1.0 when the stripped actual and reference texts are equal, otherwise 0.0.
+ # language_type and code_template_key must match the `Python3` and `equals_checker` mapping keys exactly (no padding inside the quotes).
+ code_evaluator :
2157
+ language_type : "Python3"
2158
+ code_content : "def exec_evaluation(turn_data):\n    try:\n        # 获取实际输出和参考输出\n        actual_text = turn_data[\"turn\"][\"eval_target\"][\"actual_output\"][\"text\"]\n        reference_text = turn_data[\"turn\"][\"eval_set\"][\"reference_output\"][\"text\"]\n\n        # 比较文本相似性或相等性\n        is_equal = actual_text.strip() == reference_text.strip()\n        score = 1.0 if is_equal else 0.0\n\n        if is_equal:\n            status = \"匹配\"\n        else:\n            status = \"不匹配\"\n        reason = f\"实际输出与参考输出{status}。实际输出: '{actual_text}', 参考输出: '{reference_text}'\"\n\n        return EvalOutput(score=score, reason=reason, err_msg=\"\")\n\n    except KeyError as e:\n        return EvalOutput(score=0.0, reason=f\"字段路径未找到: {e}\", err_msg=str(e))\n    except Exception as e:\n        return EvalOutput(score=0.0, reason=f\"评估失败: {e}\", err_msg=str(e))"
2159
+ code_template_key : "equals_checker"
2160
+ code_template_name : "相等性检查器"
2161
+ contains_checker :
2162
+ JavaScript :
2163
+ receive_chat_history : false
2164
+ input_schemas :
2165
+ - name : "input"
2166
+ type : "string"
2167
+ description : "评估输入内容"
2168
+ - name : "reference_output"
2169
+ type : "string"
2170
+ description : "参考输出内容"
2171
+ - name : "actual_output"
2172
+ type : "string"
2173
+ description : "实际输出内容"
2174
+ # Containment template (JavaScript): execEvaluation returns score 1.0 when the actual text includes the reference text, otherwise 0.0.
+ # language_type and code_template_key must match the `JavaScript` and `contains_checker` mapping keys exactly (no padding inside the quotes).
+ code_evaluator :
2175
+ language_type : "JavaScript"
2176
+ code_content : "function execEvaluation(turnData) {\n    try {\n        // 获取实际输出和参考输出\n        const actualText = turnData.turn.eval_target.actual_output.text;\n        const referenceText = turnData.turn.eval_set.reference_output.text;\n\n        // 检查实际输出是否包含参考输出\n        const contains = actualText.includes(referenceText);\n        const score = contains ? 1.0 : 0.0;\n\n        const status = contains ? \"包含\" : \"不包含\";\n        const reason = `实际输出${status}参考输出。实际输出: '${actualText}', 参考输出: '${referenceText}'`;\n\n        return { score: score, reason: reason, err_msg: \"\" };\n\n    } catch (e) {\n        return { score: 0.0, reason: `评估失败: ${e.message}`, err_msg: e.message };\n    }\n}"
2177
+ code_template_key : "contains_checker"
2178
+ code_template_name : "包含性检查器"
2179
+ JS :
2143
2180
receive_chat_history : false
2181
+ input_schemas :
2182
+ - name : "input"
2183
+ type : "string"
2184
+ description : "评估输入内容"
2185
+ - name : "reference_output"
2186
+ type : "string"
2187
+ description : "参考输出内容"
2188
+ - name : "actual_output"
2189
+ type : "string"
2190
+ description : "实际输出内容"
2191
+ # Containment template (JS): execEvaluation returns score 1.0 when the actual text includes the reference text, otherwise 0.0.
+ # language_type and code_template_key must match the `JS` and `contains_checker` mapping keys exactly (no padding inside the quotes).
+ code_evaluator :
2192
+ language_type : "JS"
2193
+ code_content : "function execEvaluation(turnData) {\n    try {\n        // 获取实际输出和参考输出\n        const actualText = turnData.turn.eval_target.actual_output.text;\n        const referenceText = turnData.turn.eval_set.reference_output.text;\n\n        // 检查实际输出是否包含参考输出\n        const contains = actualText.includes(referenceText);\n        const score = contains ? 1.0 : 0.0;\n\n        const status = contains ? \"包含\" : \"不包含\";\n        const reason = `实际输出${status}参考输出。实际输出: '${actualText}', 参考输出: '${referenceText}'`;\n\n        return { score: score, reason: reason, err_msg: \"\" };\n\n    } catch (e) {\n        return { score: 0.0, reason: `评估失败: ${e.message}`, err_msg: e.message };\n    }\n}"
2194
+ code_template_key : "contains_checker"
2195
+ code_template_name : "包含性检查器"
0 commit comments