Spaces:
Sleeping
Sleeping
Fix metric.run_metric out of the try-except-else (#33)
Browse files
- Fix metric.run_metric out of the try-except-else (58e1e43f19dda84e0d3616912158f0a5b9253df8)
Co-authored-by: Francesco Giannuzzo <[email protected]>
- utilities.py +7 -2
utilities.py
CHANGED
@@ -185,13 +185,18 @@ def evaluate_answer(df):
|
|
185 |
target = row["target_answer"]
|
186 |
predicted = row["predicted_answer"]
|
187 |
try:
|
188 |
-
|
189 |
except Exception as e:
|
190 |
-
result =
|
|
|
|
|
191 |
results.append(result)
|
192 |
df[metric_name] = results
|
193 |
return df
|
194 |
|
|
|
|
|
|
|
195 |
models = [
|
196 |
"gpt-4o-mini",
|
197 |
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
|
|
|
185 |
target = row["target_answer"]
|
186 |
predicted = row["predicted_answer"]
|
187 |
try:
|
188 |
+
predicted = eval(predicted)
|
189 |
except Exception as e:
|
190 |
+
result = 0
|
191 |
+
else:
|
192 |
+
result = metric.run_metric(target = target, prediction = predicted)
|
193 |
results.append(result)
|
194 |
df[metric_name] = results
|
195 |
return df
|
196 |
|
197 |
+
|
198 |
+
|
199 |
+
|
200 |
models = [
|
201 |
"gpt-4o-mini",
|
202 |
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
|