elliotthwangmsa committed on
Commit
1d979b8
·
verified ·
1 Parent(s): 63f7188

elliotthwangmsa/gemma-3-270m-train_ouputs

Browse files
README.md CHANGED
@@ -34,11 +34,11 @@ This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.21.0
38
- - Transformers: 4.55.4
39
  - Pytorch: 2.8.0+cu126
40
  - Datasets: 4.0.0
41
- - Tokenizers: 0.21.4
42
 
43
  ## Citations
44
 
 
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.22.1
38
+ - Transformers: 4.56.0
39
  - Pytorch: 2.8.0+cu126
40
  - Datasets: 4.0.0
41
+ - Tokenizers: 0.22.0
42
 
43
  ## Citations
44
 
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": null,
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
@@ -25,9 +25,9 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "k_proj",
29
  "v_proj",
30
  "o_proj",
 
31
  "q_proj"
32
  ],
33
  "target_parameters": null,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "google/gemma-3-270m",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
28
  "v_proj",
29
  "o_proj",
30
+ "k_proj",
31
  "q_proj"
32
  ],
33
  "target_parameters": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4e3a9454473cff5327ccf68e267b9ec370d9fc9284e4d337a2246d13d4b52412
3
- size 2970320
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1055878f8762de53ec39b267dc952cdbb32079c7c57bf08562292c508c11bf38
3
+ size 2967872
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14b8b2b6127b54d73035fa32a971b86149887109ffdae891c3e7bc7a2a9f67bb
3
  size 6161
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:948434fa5a1668c5d52e9d442848e64d73163e1128da80bc23e9ecf52bc914bc
3
  size 6161