baseten-admin committed on
Commit
03f5a34
·
verified ·
1 Parent(s): 9441bbb

baseten-admin/gpt-oss-20b-multilingual-reasoner

Browse files
README.md CHANGED
@@ -27,17 +27,17 @@ print(output["generated_text"])
27
 
28
  ## Training procedure
29
 
30
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/philipkiely-baseten/huggingface/runs/efvevbg6)
31
 
32
 
33
  This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.24.0
38
  - Transformers: 4.57.1
39
  - Pytorch: 2.7.0+cu128
40
- - Datasets: 4.2.0
41
  - Tokenizers: 0.22.1
42
 
43
  ## Citations
 
27
 
28
  ## Training procedure
29
 
30
+
31
 
32
 
33
  This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.25.1
38
  - Transformers: 4.57.1
39
  - Pytorch: 2.7.0+cu128
40
+ - Datasets: 4.4.1
41
  - Tokenizers: 0.22.1
42
 
43
  ## Citations
adapter_config.json CHANGED
@@ -28,10 +28,10 @@
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
- "k_proj",
32
- "o_proj",
33
  "q_proj",
34
- "v_proj"
 
35
  ],
36
  "target_parameters": [
37
  "7.mlp.experts.gate_up_proj",
 
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
+ "v_proj",
 
32
  "q_proj",
33
+ "k_proj",
34
+ "o_proj"
35
  ],
36
  "target_parameters": [
37
  "7.mlp.experts.gate_up_proj",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5892c75dc318cd561e3b1ec3e32143ea1e9c8bbd4b9511b7290eb95ed288cfb4
3
  size 60189176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4405c22b2a4d5be1a0c10689e9f10fd3e64cfaaad3a5c05475bcea6bbf74a71
3
  size 60189176
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57a66f5e82167bb27f1d9d62120451b1e7349b7951e1700cec16a4153edfee63
3
  size 6289
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26c55c21afeeed9d41d2d5843a7e3232bd43415ac8ab47ed3851fc1b68f3ba3d
3
  size 6289