pyamy committed on
Commit
ffc0564
·
verified ·
1 Parent(s): a63ba8e

Upload folder using huggingface_hub

Browse files
adapter_config.json CHANGED
@@ -25,10 +25,10 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "v_proj",
29
  "q_proj",
30
- "k_proj",
31
- "o_proj"
 
32
  ],
33
  "task_type": "CAUSAL_LM",
34
  "trainable_token_indices": null,
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
28
  "q_proj",
29
+ "o_proj",
30
+ "v_proj",
31
+ "k_proj"
32
  ],
33
  "task_type": "CAUSAL_LM",
34
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13ba49c8c8687d106786e91b8c0258edff6596f2dd11380fe35f520091103336
3
  size 33588528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e468e2d77297d7ad91d2aa50ebdc3d4dcefb69defd07547654dbdaa3484a17f1
3
  size 33588528
checkpoint-50/adapter_config.json CHANGED
@@ -25,9 +25,9 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "v_proj",
29
- "o_proj",
30
  "q_proj",
 
 
31
  "k_proj"
32
  ],
33
  "task_type": "CAUSAL_LM",
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
 
28
  "q_proj",
29
+ "o_proj",
30
+ "v_proj",
31
  "k_proj"
32
  ],
33
  "task_type": "CAUSAL_LM",
checkpoint-50/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13be47a2dabeff36de460c674873690540819ce5dc76774e918e6c6350816d01
3
  size 33588528
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e468e2d77297d7ad91d2aa50ebdc3d4dcefb69defd07547654dbdaa3484a17f1
3
  size 33588528
checkpoint-50/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0b131699f30ee0b6f7adbe1e51d969e0f294bff32e6a3e5b10457540c26eeea
3
  size 17338708
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8fba518fb2ff6da256d9f7c587bf8689c7ee4025b42948ae0259e31306c7d11
3
  size 17338708
checkpoint-50/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a206d9f667d8ea3ff758745bc598392dfea22625e5fa47093cb96bf116f36e32
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cf89169291703cf6b96550e33edc2c6a95bc870029fa76b33d1b7b4507afeb6
3
  size 14244
checkpoint-50/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:679891a6f5a888edbeebb4d778cff89972ef778c4087bae746c97dfe9244f249
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d4e40b4ba2b33c214f8a0e942f429620d2826c1735b2b9fa48265d44caa87cb
3
  size 988
checkpoint-50/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e417c65f270cd74e6f1d7db3f4d911a6218769029f43db0bb8de7fec70c27119
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:281827ead75066f664b29f5c22ee974cb25ad2d35f99b381f96c3f43fe213728
3
  size 1064
checkpoint-50/trainer_state.json CHANGED
@@ -2,7 +2,7 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 16.88888888888889,
6
  "eval_steps": 500,
7
  "global_step": 50,
8
  "is_hyper_param_search": false,
@@ -10,45 +10,45 @@
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
- "epoch": 3.4444444444444446,
14
- "grad_norm": 0.23509381711483002,
15
- "learning_rate": 0.00018,
16
- "loss": 1.8657,
17
  "step": 10
18
  },
19
  {
20
- "epoch": 6.888888888888889,
21
- "grad_norm": 0.4787384867668152,
22
- "learning_rate": 0.000155,
23
- "loss": 1.6866,
24
  "step": 20
25
  },
26
  {
27
- "epoch": 10.0,
28
- "grad_norm": 0.880219042301178,
29
- "learning_rate": 0.000105,
30
- "loss": 1.3819,
31
  "step": 30
32
  },
33
  {
34
- "epoch": 13.444444444444445,
35
- "grad_norm": 0.641683042049408,
36
- "learning_rate": 5.500000000000001e-05,
37
- "loss": 1.1817,
38
  "step": 40
39
  },
40
  {
41
- "epoch": 16.88888888888889,
42
- "grad_norm": 0.681348979473114,
43
- "learning_rate": 5e-06,
44
- "loss": 1.022,
45
  "step": 50
46
  }
47
  ],
48
  "logging_steps": 10,
49
  "max_steps": 50,
50
  "num_input_tokens_seen": 0,
51
- "num_train_epochs": 17,
52
  "save_steps": 50,
53
  "stateful_callbacks": {
54
  "TrainerControl": {
@@ -62,7 +62,7 @@
62
  "attributes": {}
63
  }
64
  },
65
- "total_flos": 3089176467603456.0,
66
  "train_batch_size": 1,
67
  "trial_name": null,
68
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 25.0,
6
  "eval_steps": 500,
7
  "global_step": 50,
8
  "is_hyper_param_search": false,
 
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
+ "epoch": 5.0,
14
+ "grad_norm": 1.823412537574768,
15
+ "learning_rate": 0.00014,
16
+ "loss": 2.6875,
17
  "step": 10
18
  },
19
  {
20
+ "epoch": 10.0,
21
+ "grad_norm": 0.30645912885665894,
22
+ "learning_rate": 0.000165,
23
+ "loss": 1.9697,
24
  "step": 20
25
  },
26
  {
27
+ "epoch": 15.0,
28
+ "grad_norm": 0.487067312002182,
29
+ "learning_rate": 0.00011499999999999999,
30
+ "loss": 1.5021,
31
  "step": 30
32
  },
33
  {
34
+ "epoch": 20.0,
35
+ "grad_norm": 0.8200891613960266,
36
+ "learning_rate": 6.500000000000001e-05,
37
+ "loss": 1.234,
38
  "step": 40
39
  },
40
  {
41
+ "epoch": 25.0,
42
+ "grad_norm": 0.9909401535987854,
43
+ "learning_rate": 1.5e-05,
44
+ "loss": 0.9953,
45
  "step": 50
46
  }
47
  ],
48
  "logging_steps": 10,
49
  "max_steps": 50,
50
  "num_input_tokens_seen": 0,
51
+ "num_train_epochs": 25,
52
  "save_steps": 50,
53
  "stateful_callbacks": {
54
  "TrainerControl": {
 
62
  "attributes": {}
63
  }
64
  },
65
+ "total_flos": 4064705878425600.0,
66
  "train_batch_size": 1,
67
  "trial_name": null,
68
  "trial_params": null
checkpoint-50/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3fd48ad7e7c5bcb67d8f7bec6dd926a2d8d3ad361b44ce136d6d2d7c994e8199
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e806016397e36524f90ee92db251177b3f47cb2b360e8ff461ef1d934439559
3
  size 5304
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4e8f1dd9a9d5ca2ecbbfcb36f632a8f15434d2f5f952ac45738d3abf965e26a
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e806016397e36524f90ee92db251177b3f47cb2b360e8ff461ef1d934439559
3
  size 5304