ambrosfitz committed on
Commit
5ec9df2
·
verified ·
1 Parent(s): 25be6e7

Upload training_metrics.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_metrics.json +14 -0
training_metrics.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base_model": "Qwen/Qwen2.5-1.5B-Instruct",
3
+ "training_method": "GRPO with Unsloth",
4
+ "dataset_size": 1602,
5
+ "training_steps": 360,
6
+ "final_reward": 3.17,
7
+ "improvement": "+67%",
8
+ "key_achievements": [
9
+ "Foreign language bias detection",
10
+ "Structured reasoning output",
11
+ "67% reward improvement",
12
+ "46% reduction in output variance"
13
+ ]
14
+ }