Upload folder using huggingface_hub

Files changed (10) hide show

adapter_config.json CHANGED Viewed

@@ -25,10 +25,10 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "o_proj",
     "q_proj",
-    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "q_proj",
+    "k_proj",
+    "v_proj",
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:616d027fb005edff9745e7c771538e7da2b03596707bad0242163b2fc606ad11
 size 33588528

 version https://git-lfs.github.com/spec/v1
+oid sha256:52bc3ecfc964e633b395cf812586870c7cc362c3ed21ac4c7b593874543c7975
 size 33588528

checkpoint-50/adapter_config.json CHANGED Viewed

@@ -25,10 +25,10 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
-    "o_proj",
     "q_proj",
-    "k_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "q_proj",
+    "k_proj",
+    "v_proj",
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

checkpoint-50/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:616d027fb005edff9745e7c771538e7da2b03596707bad0242163b2fc606ad11
 size 33588528

 version https://git-lfs.github.com/spec/v1
+oid sha256:52bc3ecfc964e633b395cf812586870c7cc362c3ed21ac4c7b593874543c7975
 size 33588528

checkpoint-50/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a580fd932e1b65d83e870d30e92e823e851317b9f942cefdcc0d34b4aac5f263
 size 17338708

 version https://git-lfs.github.com/spec/v1
+oid sha256:38322fa67c0cd9b4bea2f8ed1ea3fa702cf1c76a8e623fe2b4b4468e581047b2
 size 17338708

checkpoint-50/scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f4a0e99f2cd8a3b5675a350b3b4e3d065c31530d1da439f4d4e2562f4cf72cd2
 size 988

 version https://git-lfs.github.com/spec/v1
+oid sha256:e16548743276424cd66e7996bdcfd2223400028fb58a78b40458f14aa4250dd8
 size 988

checkpoint-50/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fc546be0326b4a0b2e6a212bb8589b29ecc3eb77870dc69fdc4706bbcece8bf2
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:55a3b0f2ba55e355a29b19063f461fa9b5392d5c673dcc7784da8b9c5691fb1f
 size 1064

checkpoint-50/trainer_state.json CHANGED Viewed

@@ -11,37 +11,37 @@
   "log_history": [
     {
       "epoch": 0.16,
-      "grad_norm": 41.431053161621094,
       "learning_rate": 0.00012,
-      "loss": 33.6557,
       "step": 10
     },
     {
       "epoch": 0.32,
-      "grad_norm": 7.633413314819336,
-      "learning_rate": 0.00017,
-      "loss": 13.5995,
       "step": 20
     },
     {
       "epoch": 0.48,
-      "grad_norm": 0.17992551624774933,
-      "learning_rate": 0.00012,
-      "loss": 0.1692,
       "step": 30
     },
     {
       "epoch": 0.64,
-      "grad_norm": 0.11148593574762344,
-      "learning_rate": 7e-05,
-      "loss": 0.1384,
       "step": 40
     },
     {
       "epoch": 0.8,
-      "grad_norm": 0.11761105805635452,
-      "learning_rate": 2e-05,
-      "loss": 0.115,
       "step": 50
     }
   ],

   "log_history": [
     {
       "epoch": 0.16,
+      "grad_norm": NaN,
       "learning_rate": 0.00012,
+      "loss": 33.5024,
       "step": 10
     },
     {
       "epoch": 0.32,
+      "grad_norm": 8.700640678405762,
+      "learning_rate": 0.000175,
+      "loss": 16.2186,
       "step": 20
     },
     {
       "epoch": 0.48,
+      "grad_norm": 0.22131234407424927,
+      "learning_rate": 0.000125,
+      "loss": 0.1905,
       "step": 30
     },
     {
       "epoch": 0.64,
+      "grad_norm": 0.11870493739843369,
+      "learning_rate": 7.500000000000001e-05,
+      "loss": 0.1386,
       "step": 40
     },
     {
       "epoch": 0.8,
+      "grad_norm": 0.1110013872385025,
+      "learning_rate": 2.5e-05,
+      "loss": 0.1143,
       "step": 50
     }
   ],

checkpoint-50/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f1f0bc7579225e5bda2d02e3f9ab438477eceb2e35462a762b5f86825bd52af8
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:b1f60acf5fc471590e2b4ac63d9c481ed856618b1b406e6a68b2ac2ff182d6d1
 size 5304

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f1f0bc7579225e5bda2d02e3f9ab438477eceb2e35462a762b5f86825bd52af8
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:b1f60acf5fc471590e2b4ac63d9c481ed856618b1b406e6a68b2ac2ff182d6d1
 size 5304