xhluca committed on
Commit
d7a5d72
·
verified ·
1 Parent(s): 91c446a

Remove redundant training data notes from comments

Browse files
results/A3-Qwen3.5-9B/miniwob.json CHANGED
@@ -10,7 +10,7 @@
10
  "benchmark_tuned": "No",
11
  "followed_evaluation_protocol": "Yes",
12
  "reproducible": "Yes",
13
- "comments": "625 tasks. Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework. Not trained on MiniWoB data.",
14
  "original_or_reproduced": "Original"
15
  }
16
  ]
 
10
  "benchmark_tuned": "No",
11
  "followed_evaluation_protocol": "Yes",
12
  "reproducible": "Yes",
13
+ "comments": "625 tasks. Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.",
14
  "original_or_reproduced": "Original"
15
  }
16
  ]
results/A3-Qwen3.5-9B/workarena-l1.json CHANGED
@@ -10,7 +10,7 @@
10
  "benchmark_tuned": "No",
11
  "followed_evaluation_protocol": "Yes",
12
  "reproducible": "Yes",
13
- "comments": "330 tasks. Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework. Not trained on ServiceNow data.",
14
  "original_or_reproduced": "Original"
15
  }
16
  ]
 
10
  "benchmark_tuned": "No",
11
  "followed_evaluation_protocol": "Yes",
12
  "reproducible": "Yes",
13
+ "comments": "330 tasks. Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.",
14
  "original_or_reproduced": "Original"
15
  }
16
  ]
results/A3-Qwen3.5-9B/workarena-l2.json CHANGED
@@ -10,7 +10,7 @@
10
  "benchmark_tuned": "No",
11
  "followed_evaluation_protocol": "Yes",
12
  "reproducible": "Yes",
13
- "comments": "341 tasks (full benchmark). Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework. Not trained on ServiceNow data.",
14
  "original_or_reproduced": "Original"
15
  }
16
  ]
 
10
  "benchmark_tuned": "No",
11
  "followed_evaluation_protocol": "Yes",
12
  "reproducible": "Yes",
13
+ "comments": "341 tasks (full benchmark). Fine-tuned on A3-Synth trajectories via the Agent-as-Annotators framework.",
14
  "original_or_reproduced": "Original"
15
  }
16
  ]