Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -185,18 +185,24 @@ def evaluate_single_data(model_name, data, client, executor, prompt_template, pr
|
|
| 185 |
images_result = None
|
| 186 |
else:
|
| 187 |
output, report = exe_result
|
| 188 |
-
|
| 189 |
-
|
| 190 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 191 |
text_result = None
|
| 192 |
-
print("text result is none.")
|
| 193 |
-
try:
|
| 194 |
-
images_result = exe_result[0]['images']
|
| 195 |
-
except:
|
| 196 |
images_result = None
|
| 197 |
-
print("image result is none.")
|
| 198 |
|
| 199 |
-
messages, new_image_clue_idx = update_messages_with_excu_content(messages, images_result, text_result, image_clue_idx)
|
| 200 |
image_clue_idx = new_image_clue_idx
|
| 201 |
|
| 202 |
code_execution_count += 1
|
|
|
|
| 185 |
images_result = None
|
| 186 |
else:
|
| 187 |
output, report = exe_result
|
| 188 |
+
if report == "Done":
|
| 189 |
+
error_result = None
|
| 190 |
+
try:
|
| 191 |
+
text_result = exe_result[0]['text']
|
| 192 |
+
except:
|
| 193 |
+
text_result = None
|
| 194 |
+
print("text result is none.")
|
| 195 |
+
try:
|
| 196 |
+
images_result = exe_result[0]['images']
|
| 197 |
+
except:
|
| 198 |
+
images_result = None
|
| 199 |
+
print("image result is none.")
|
| 200 |
+
else:
|
| 201 |
+
error_result = report
|
| 202 |
text_result = None
|
|
|
|
|
|
|
|
|
|
|
|
|
| 203 |
images_result = None
|
|
|
|
| 204 |
|
| 205 |
+
messages, new_image_clue_idx = update_messages_with_excu_content(messages, images_result, text_result, error_result, image_clue_idx)
|
| 206 |
image_clue_idx = new_image_clue_idx
|
| 207 |
|
| 208 |
code_execution_count += 1
|