taozhang9527 committed on
Commit
5d8a29d
·
verified ·
1 Parent(s): 62473b1

Training in progress, step 21

Browse files
Files changed (4) hide show
  1. README.md +3 -3
  2. config.json +2 -2
  3. model.safetensors +1 -1
  4. training_args.bin +1 -1
README.md CHANGED
@@ -1,17 +1,17 @@
1
  ---
2
- base_model: Qwen/Qwen3-1.7B
3
  library_name: transformers
4
  model_name: wordle-grpo-Qwen3-1.7B-test
5
  tags:
6
  - generated_from_trainer
7
- - grpo
8
  - trl
 
9
  licence: license
10
  ---
11
 
12
  # Model Card for wordle-grpo-Qwen3-1.7B-test
13
 
14
- This model is a fine-tuned version of [Qwen/Qwen3-1.7B](https://huggingface.co/Qwen/Qwen3-1.7B).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
 
1
  ---
2
+ base_model: Qwen/Qwen3-0.6B
3
  library_name: transformers
4
  model_name: wordle-grpo-Qwen3-1.7B-test
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - grpo
9
  licence: license
10
  ---
11
 
12
  # Model Card for wordle-grpo-Qwen3-1.7B-test
13
 
14
+ This model is a fine-tuned version of [Qwen/Qwen3-0.6B](https://huggingface.co/Qwen/Qwen3-0.6B).
15
  It has been trained using [TRL](https://github.com/huggingface/trl).
16
 
17
  ## Quick start
config.json CHANGED
@@ -8,9 +8,9 @@
8
  "eos_token_id": 151645,
9
  "head_dim": 128,
10
  "hidden_act": "silu",
11
- "hidden_size": 2048,
12
  "initializer_range": 0.02,
13
- "intermediate_size": 6144,
14
  "layer_types": [
15
  "full_attention",
16
  "full_attention",
 
8
  "eos_token_id": 151645,
9
  "head_dim": 128,
10
  "hidden_act": "silu",
11
+ "hidden_size": 1024,
12
  "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
  "layer_types": [
15
  "full_attention",
16
  "full_attention",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d78fa6a47cb4f5f9addfaa17aeba8eec9f6d20fdc1a67169a30dbdaa9b007907
3
  size 2384234968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff3bb35cde188872d394f445a97568c67570c2d31ae8361a78f9607d63b8555a
3
  size 2384234968
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3d0c42e59afe4bca16ba2be40f88364248227c37e50bf9fe877aec2ff4ef909
3
  size 7697
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33dcaf4ae329691abb1c3990f1902c0856dd75ca3679897084998996c5de30ad
3
  size 7697