baseten-admin committed on
Commit
5dec92f
·
verified ·
1 Parent(s): b1aff24

baseten-admin/gpt-oss-20b-multilingual-reasoner-e2e

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: gpt-oss-20b-multilingual-reasoner
5
  tags:
6
  - generated_from_trainer
7
- - sft
8
  - trl
 
9
  licence: license
10
  ---
11
 
@@ -27,7 +27,7 @@ print(output["generated_text"])
27
 
28
  ## Training procedure
29
 
30
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/philipkiely-baseten/huggingface/runs/11tap9lm)
31
 
32
 
33
  This model was trained with SFT.
 
4
  model_name: gpt-oss-20b-multilingual-reasoner
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
+ - sft
9
  licence: license
10
  ---
11
 
 
27
 
28
  ## Training procedure
29
 
30
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/philipkiely-baseten/huggingface/runs/rgkdmqkl)
31
 
32
 
33
  This model was trained with SFT.
adapter_config.json CHANGED
@@ -28,10 +28,10 @@
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
- "v_proj",
32
- "k_proj",
33
  "o_proj",
34
- "q_proj"
 
 
35
  ],
36
  "target_parameters": [
37
  "7.mlp.experts.gate_up_proj",
 
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
 
 
31
  "o_proj",
32
+ "q_proj",
33
+ "k_proj",
34
+ "v_proj"
35
  ],
36
  "target_parameters": [
37
  "7.mlp.experts.gate_up_proj",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7cfdf2c24c5b951d7a361a425307e19aa178394a47d7b19986b78c8b85f24d6f
3
  size 60189176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a76bc8736aaad5ce7dec89eb155ff35dac7e0700a0e9d5ac9f663b40b4e7233
3
  size 60189176
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:797f4b67ccad0feb5247bd5a007b2c3c8edb0de9415a1f699e51390656762d57
3
  size 6225
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:641a469654a61353a7935807fbda45fb5619169b26648f988a956b184bde304f
3
  size 6225