Upload folder using huggingface_hub

Files changed (10) hide show

adapter_config.json CHANGED Viewed

@@ -25,9 +25,9 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "o_proj",
     "v_proj",
     "k_proj"
   ],
   "task_type": "CAUSAL_LM",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
+    "o_proj",
+    "q_proj",
     "k_proj"
   ],
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e468e2d77297d7ad91d2aa50ebdc3d4dcefb69defd07547654dbdaa3484a17f1
 size 33588528

 version https://git-lfs.github.com/spec/v1
+oid sha256:7527027d86c2f99fb4a21349c730585d104c214f60e49f314d66f5a733bc9a50
 size 33588528

checkpoint-50/adapter_config.json CHANGED Viewed

@@ -25,9 +25,9 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "o_proj",
     "v_proj",
     "k_proj"
   ],
   "task_type": "CAUSAL_LM",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
+    "o_proj",
+    "q_proj",
     "k_proj"
   ],
   "task_type": "CAUSAL_LM",

checkpoint-50/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e468e2d77297d7ad91d2aa50ebdc3d4dcefb69defd07547654dbdaa3484a17f1
 size 33588528

 version https://git-lfs.github.com/spec/v1
+oid sha256:7527027d86c2f99fb4a21349c730585d104c214f60e49f314d66f5a733bc9a50
 size 33588528

checkpoint-50/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a8fba518fb2ff6da256d9f7c587bf8689c7ee4025b42948ae0259e31306c7d11
 size 17338708

 version https://git-lfs.github.com/spec/v1
+oid sha256:c074625f59c355cb1db0e83337b49e4b45d7202294c8e85514c2b801bff024e7
 size 17338708

checkpoint-50/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3cf89169291703cf6b96550e33edc2c6a95bc870029fa76b33d1b7b4507afeb6
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:354615fc8387693f24d82e680c5229ada92ecc73c65770aa0d2ec2f22d519ce2
 size 14244

checkpoint-50/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9d4e40b4ba2b33c214f8a0e942f429620d2826c1735b2b9fa48265d44caa87cb
 size 988

 version https://git-lfs.github.com/spec/v1
+oid sha256:4ae5b6e1493c7b53e741deaed6ac33c1459c9d8e052b89f8241e547b1872d8a8
 size 988

checkpoint-50/trainer_state.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 25.0,
   "eval_steps": 500,
   "global_step": 50,
   "is_hyper_param_search": false,
@@ -10,45 +10,45 @@
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 5.0,
-      "grad_norm": 1.823412537574768,
       "learning_rate": 0.00014,
-      "loss": 2.6875,
       "step": 10
     },
     {
-      "epoch": 10.0,
-      "grad_norm": 0.30645912885665894,
       "learning_rate": 0.000165,
-      "loss": 1.9697,
       "step": 20
     },
     {
-      "epoch": 15.0,
-      "grad_norm": 0.487067312002182,
       "learning_rate": 0.00011499999999999999,
-      "loss": 1.5021,
       "step": 30
     },
     {
-      "epoch": 20.0,
-      "grad_norm": 0.8200891613960266,
       "learning_rate": 6.500000000000001e-05,
-      "loss": 1.234,
       "step": 40
     },
     {
-      "epoch": 25.0,
-      "grad_norm": 0.9909401535987854,
       "learning_rate": 1.5e-05,
-      "loss": 0.9953,
       "step": 50
     }
   ],
   "logging_steps": 10,
   "max_steps": 50,
   "num_input_tokens_seen": 0,
-  "num_train_epochs": 25,
   "save_steps": 50,
   "stateful_callbacks": {
     "TrainerControl": {
@@ -62,7 +62,7 @@
       "attributes": {}
     }
   },
-  "total_flos": 4064705878425600.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 12.533333333333333,
   "eval_steps": 500,
   "global_step": 50,
   "is_hyper_param_search": false,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 2.533333333333333,
+      "grad_norm": 5.1353068351745605,
       "learning_rate": 0.00014,
+      "loss": 7.9209,
       "step": 10
     },
     {
+      "epoch": 5.0,
+      "grad_norm": 1.2159311771392822,
       "learning_rate": 0.000165,
+      "loss": 3.5184,
       "step": 20
     },
     {
+      "epoch": 7.533333333333333,
+      "grad_norm": 0.17727278172969818,
       "learning_rate": 0.00011499999999999999,
+      "loss": 1.3178,
       "step": 30
     },
     {
+      "epoch": 10.0,
+      "grad_norm": 0.20721666514873505,
       "learning_rate": 6.500000000000001e-05,
+      "loss": 1.3595,
       "step": 40
     },
     {
+      "epoch": 12.533333333333333,
+      "grad_norm": 0.1987001746892929,
       "learning_rate": 1.5e-05,
+      "loss": 1.2959,
       "step": 50
     }
   ],
   "logging_steps": 10,
   "max_steps": 50,
   "num_input_tokens_seen": 0,
+  "num_train_epochs": 13,
   "save_steps": 50,
   "stateful_callbacks": {
     "TrainerControl": {
       "attributes": {}
     }
   },
+  "total_flos": 7641647051440128.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

checkpoint-50/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3e806016397e36524f90ee92db251177b3f47cb2b360e8ff461ef1d934439559
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:d803a248f86aede78be3460d30806bdea503d572393c5e5c9706e3cd81f51c6e
 size 5304

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3e806016397e36524f90ee92db251177b3f47cb2b360e8ff461ef1d934439559
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:d803a248f86aede78be3460d30806bdea503d572393c5e5c9706e3cd81f51c6e
 size 5304