dandan04 committed on
Commit
6039483
·
verified ·
1 Parent(s): 2e4153e

Training in progress, epoch 1

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: medgemma-4b-it-sft-lora-crc100k
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
  - sft
 
9
  licence: license
10
  ---
11
 
 
4
  model_name: medgemma-4b-it-sft-lora-crc100k
5
  tags:
6
  - generated_from_trainer
 
7
  - sft
8
+ - trl
9
  licence: license
10
  ---
11
 
adapter_config.json CHANGED
@@ -28,16 +28,16 @@
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
31
- "gate_proj",
32
- "down_proj",
33
- "o_proj",
34
- "out_proj",
35
  "fc1",
36
- "fc2",
37
  "k_proj",
38
- "q_proj",
 
39
  "v_proj",
40
- "up_proj"
 
 
 
 
41
  ],
42
  "task_type": "CAUSAL_LM",
43
  "trainable_token_indices": null,
 
28
  "rank_pattern": {},
29
  "revision": null,
30
  "target_modules": [
 
 
 
 
31
  "fc1",
 
32
  "k_proj",
33
+ "up_proj",
34
+ "fc2",
35
  "v_proj",
36
+ "gate_proj",
37
+ "q_proj",
38
+ "down_proj",
39
+ "out_proj",
40
+ "o_proj"
41
  ],
42
  "task_type": "CAUSAL_LM",
43
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf5fa9b899a38daa5c696d7a740c17d33e2898bc9ff60d6f979c1af3712e6fdc
3
  size 2839126480
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d972fd9e4f7282985b79660e5062baa43d32e2b18d7db4fd29c74ce6a7ccb56d
3
  size 2839126480
runs/Jul27_21-30-05_d6078ce9c2bc/events.out.tfevents.1753651808.d6078ce9c2bc.5963.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:628d0989349f7e12a5954588f12c10fca8109fbf7f2cbc4824a63c926abbac1e
3
+ size 9321
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bb45a931c712b28ddfc3a2b5a71094622f2fd49fc71c7893067d7b36518b1f3
3
  size 5816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0880f1ca061da9fdbc8805850d5a7cdd349321c64acfa88aab788b0d57e8d65e
3
  size 5816