Remove redundant training data notes from comments
Browse files
results/A3-Qwen3.5-9B/miniwob.json
CHANGED
|
@@ -10,7 +10,7 @@
|
|
| 10 |
"benchmark_tuned": "No",
|
| 11 |
"followed_evaluation_protocol": "Yes",
|
| 12 |
"reproducible": "Yes",
|
| 13 |
-
"comments": "625 tasks. Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.
|
| 14 |
"original_or_reproduced": "Original"
|
| 15 |
}
|
| 16 |
]
|
|
|
|
| 10 |
"benchmark_tuned": "No",
|
| 11 |
"followed_evaluation_protocol": "Yes",
|
| 12 |
"reproducible": "Yes",
|
| 13 |
+
"comments": "625 tasks. Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.",
|
| 14 |
"original_or_reproduced": "Original"
|
| 15 |
}
|
| 16 |
]
|
results/A3-Qwen3.5-9B/workarena-l1.json
CHANGED
|
@@ -10,7 +10,7 @@
|
|
| 10 |
"benchmark_tuned": "No",
|
| 11 |
"followed_evaluation_protocol": "Yes",
|
| 12 |
"reproducible": "Yes",
|
| 13 |
-
"comments": "330 tasks. Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.
|
| 14 |
"original_or_reproduced": "Original"
|
| 15 |
}
|
| 16 |
]
|
|
|
|
| 10 |
"benchmark_tuned": "No",
|
| 11 |
"followed_evaluation_protocol": "Yes",
|
| 12 |
"reproducible": "Yes",
|
| 13 |
+
"comments": "330 tasks. Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.",
|
| 14 |
"original_or_reproduced": "Original"
|
| 15 |
}
|
| 16 |
]
|
results/A3-Qwen3.5-9B/workarena-l2.json
CHANGED
|
@@ -10,7 +10,7 @@
|
|
| 10 |
"benchmark_tuned": "No",
|
| 11 |
"followed_evaluation_protocol": "Yes",
|
| 12 |
"reproducible": "Yes",
|
| 13 |
-
"comments": "341 tasks (full benchmark). Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.
|
| 14 |
"original_or_reproduced": "Original"
|
| 15 |
}
|
| 16 |
]
|
|
|
|
| 10 |
"benchmark_tuned": "No",
|
| 11 |
"followed_evaluation_protocol": "Yes",
|
| 12 |
"reproducible": "Yes",
|
| 13 |
+
"comments": "341 tasks (full benchmark). Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.",
|
| 14 |
"original_or_reproduced": "Original"
|
| 15 |
}
|
| 16 |
]
|