Commit 2bfc27eb by ccran

feat: 增加测试结果;

parent 07aaa16d
......@@ -208,7 +208,6 @@ def filter_rows_by_llm_result(
continue
ground_truth_text = str(ground_truth).strip()
ground_truth_text = '合格'
try:
for attempt in Retrying(wait=wait_fixed(1), stop=stop_after_attempt(max_retries), reraise=True):
......@@ -231,7 +230,7 @@ def filter_rows_by_llm_result(
)
raise ValueError("llm result mismatch")
print(f"[llm_match] row={index}, attempt={attempt.retry_state.attempt_number},result={result_text}")
-row['rsp'] = f'<think>{reasoning_content}</think>{result_text}'
+row['rsp'] = f'<think>{reasoning_content}</think>{content}'
except Exception as exc:
row['rsp'] = ''
print(f"[llm_drop] row={index}, error={exc}")
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment