End of training

- README.md +2 -1
- all_results.json +8 -0
- train_results.json +8 -0
- trainer_state.json +603 -0
- training_loss.png +0 -0
README.md
CHANGED
@@ -4,6 +4,7 @@ license: apache-2.0
 base_model: Qwen/Qwen3-4B-Instruct-2507
 tags:
 - llama-factory
+- full
 - generated_from_trainer
 model-index:
 - name: Qwen3-4B-Instruct_0910_LODO_gitlab_full
@@ -15,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 
 # Qwen3-4B-Instruct_0910_LODO_gitlab_full
 
-This model is a fine-tuned version of [Qwen/Qwen3-4B-Instruct-2507](https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507) on
+This model is a fine-tuned version of [Qwen/Qwen3-4B-Instruct-2507](https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507) on the Policy_Traj_LODO_gitlab dataset.
 
 ## Model description
 
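The updated card only names the base model and the dataset. As a minimal usage sketch for a full fine-tune like this one, the standard transformers loading pattern applies; the repo id below is a placeholder, since the actual namespace is not shown in this commit.

# Minimal sketch of loading the fine-tuned checkpoint with transformers.
# "<namespace>/Qwen3-4B-Instruct_0910_LODO_gitlab_full" is a placeholder repo id.
from transformers import AutoModelForCausalLM, AutoTokenizer

repo_id = "<namespace>/Qwen3-4B-Instruct_0910_LODO_gitlab_full"

tokenizer = AutoTokenizer.from_pretrained(repo_id)
model = AutoModelForCausalLM.from_pretrained(repo_id, torch_dtype="auto", device_map="auto")

messages = [{"role": "user", "content": "Hello!"}]
input_ids = tokenizer.apply_chat_template(
    messages, add_generation_prompt=True, return_tensors="pt"
).to(model.device)
outputs = model.generate(input_ids, max_new_tokens=128)
print(tokenizer.decode(outputs[0][input_ids.shape[-1]:], skip_special_tokens=True))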
all_results.json
ADDED
@@ -0,0 +1,8 @@
{
    "epoch": 3.0,
    "total_flos": 33113178439680.0,
    "train_loss": 0.042386234274015444,
    "train_runtime": 4174.8779,
    "train_samples_per_second": 24.521,
    "train_steps_per_second": 0.192
}
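These figures are mutually consistent with the per-device batch size recorded in trainer_state.json below. A small arithmetic sketch, assuming the usual Hugging Face Trainer meaning of each field:

# Sanity-check the reported throughput figures.
train_runtime = 4174.8779          # seconds
steps = 801                        # optimizer steps over 3 epochs
samples_per_second = 24.521
steps_per_second = 0.192

print(steps / train_runtime)                  # ~0.192   -> matches train_steps_per_second
print(samples_per_second * train_runtime)     # ~102,372 samples seen across 3 epochs (~34,100 per epoch)
print(samples_per_second / steps_per_second)  # ~128     -> effective samples per optimizer step
# With train_batch_size = 4 per device, an effective batch of ~128 implies
# gradient_accumulation_steps * world_size = 32; the exact split is not recorded in this commit.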
train_results.json
ADDED
@@ -0,0 +1,8 @@
{
    "epoch": 3.0,
    "total_flos": 33113178439680.0,
    "train_loss": 0.042386234274015444,
    "train_runtime": 4174.8779,
    "train_samples_per_second": 24.521,
    "train_steps_per_second": 0.192
}
trainer_state.json
ADDED
@@ -0,0 +1,603 @@
{
  "best_global_step": null,
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 3.0,
  "eval_steps": 500,
  "global_step": 801,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {"epoch": 0.03750586029067042, "grad_norm": 34.85824610814536, "learning_rate": 1.8e-05, "loss": 0.3557, "step": 10},
    {"epoch": 0.07501172058134084, "grad_norm": 7.1481602122450285, "learning_rate": 3.8e-05, "loss": 0.1487, "step": 20},
    {"epoch": 0.11251758087201125, "grad_norm": 8.614036123620082, "learning_rate": 4.999672209164081e-05, "loss": 0.1396, "step": 30},
    {"epoch": 0.15002344116268168, "grad_norm": 10.10705100519714, "learning_rate": 4.995985549356568e-05, "loss": 0.0895, "step": 40},
    {"epoch": 0.1875293014533521, "grad_norm": 5.6723632225651555, "learning_rate": 4.988208552916535e-05, "loss": 0.0733, "step": 50},
    {"epoch": 0.2250351617440225, "grad_norm": 3.5917593429678067, "learning_rate": 4.976353964522509e-05, "loss": 0.2835, "step": 60},
    {"epoch": 0.26254102203469293, "grad_norm": 2.7853884780818023, "learning_rate": 4.960441211072686e-05, "loss": 0.0559, "step": 70},
    {"epoch": 0.30004688232536336, "grad_norm": 1.0618750438052633, "learning_rate": 4.940496369848795e-05, "loss": 0.0562, "step": 80},
    {"epoch": 0.33755274261603374, "grad_norm": 0.21567312878465145, "learning_rate": 4.916552125781528e-05, "loss": 0.0545, "step": 90},
    {"epoch": 0.3750586029067042, "grad_norm": 6.591249771359263, "learning_rate": 4.8886477178875826e-05, "loss": 0.0665, "step": 100},
    {"epoch": 0.4125644631973746, "grad_norm": 0.2514334496388468, "learning_rate": 4.856828874966086e-05, "loss": 0.0577, "step": 110},
    {"epoch": 0.450070323488045, "grad_norm": 2.19013548059961, "learning_rate": 4.821147740659794e-05, "loss": 0.0424, "step": 120},
    {"epoch": 0.4875761837787154, "grad_norm": 1.8200457984558476, "learning_rate": 4.781662788003851e-05, "loss": 0.0435, "step": 130},
    {"epoch": 0.5250820440693859, "grad_norm": 1.788433839164408, "learning_rate": 4.738438723602154e-05, "loss": 0.0459, "step": 140},
    {"epoch": 0.5625879043600562, "grad_norm": 3.4278131423512943, "learning_rate": 4.69154638158837e-05, "loss": 0.0416, "step": 150},
    {"epoch": 0.6000937646507267, "grad_norm": 0.26651980565241046, "learning_rate": 4.641062607545347e-05, "loss": 0.0422, "step": 160},
    {"epoch": 0.6375996249413971, "grad_norm": 1.6317479332317566, "learning_rate": 4.587070132573178e-05, "loss": 0.0388, "step": 170},
    {"epoch": 0.6751054852320675, "grad_norm": 1.6520649014609303, "learning_rate": 4.529657437712276e-05, "loss": 0.0334, "step": 180},
    {"epoch": 0.712611345522738, "grad_norm": 0.15277860741515586, "learning_rate": 4.4689186089436366e-05, "loss": 0.0412, "step": 190},
    {"epoch": 0.7501172058134083, "grad_norm": 0.9030791837609309, "learning_rate": 4.404953183003916e-05, "loss": 0.036, "step": 200},
    {"epoch": 0.7876230661040787, "grad_norm": 1.9866732218980805, "learning_rate": 4.337865984268001e-05, "loss": 0.0393, "step": 210},
    {"epoch": 0.8251289263947492, "grad_norm": 0.23596674543489504, "learning_rate": 4.267766952966369e-05, "loss": 0.0385, "step": 220},
    {"epoch": 0.8626347866854196, "grad_norm": 2.7613828112655905, "learning_rate": 4.194770965018758e-05, "loss": 0.0411, "step": 230},
    {"epoch": 0.90014064697609, "grad_norm": 0.9440762280964653, "learning_rate": 4.118997643779401e-05, "loss": 0.0346, "step": 240},
    {"epoch": 0.9376465072667605, "grad_norm": 0.41009567832530625, "learning_rate": 4.0405711640023186e-05, "loss": 0.0344, "step": 250},
    {"epoch": 0.9751523675574308, "grad_norm": 0.32482405462507263, "learning_rate": 3.9596200483479385e-05, "loss": 0.0324, "step": 260},
    {"epoch": 1.0112517580872011, "grad_norm": 0.806991725526476, "learning_rate": 3.876276956764509e-05, "loss": 0.0346, "step": 270},
    {"epoch": 1.0487576183778715, "grad_norm": 1.1338976875621802, "learning_rate": 3.7906784690894645e-05, "loss": 0.0424, "step": 280},
    {"epoch": 1.086263478668542, "grad_norm": 1.500478633231241, "learning_rate": 3.702964861227013e-05, "loss": 0.0346, "step": 290},
    {"epoch": 1.1237693389592125, "grad_norm": 1.4409676013917596, "learning_rate": 3.613279875268731e-05, "loss": 0.0354, "step": 300},
    {"epoch": 1.1612751992498829, "grad_norm": 0.2422476126318276, "learning_rate": 3.521770483933891e-05, "loss": 0.034, "step": 310},
    {"epoch": 1.1987810595405533, "grad_norm": 1.5840918548478307, "learning_rate": 3.4285866497155414e-05, "loss": 0.0459, "step": 320},
    {"epoch": 1.2362869198312236, "grad_norm": 0.37403459055017013, "learning_rate": 3.333881079127052e-05, "loss": 0.0292, "step": 330},
    {"epoch": 1.273792780121894, "grad_norm": 0.7618214390592176, "learning_rate": 3.2378089724518465e-05, "loss": 0.0279, "step": 340},
    {"epoch": 1.3112986404125644, "grad_norm": 0.6779062975577348, "learning_rate": 3.1405277694064305e-05, "loss": 0.0317, "step": 350},
    {"epoch": 1.3488045007032348, "grad_norm": 0.6053365729294653, "learning_rate": 3.0421968911335196e-05, "loss": 0.0332, "step": 360},
    {"epoch": 1.3863103609939054, "grad_norm": 0.5023346538140172, "learning_rate": 2.9429774789480575e-05, "loss": 0.0258, "step": 370},
    {"epoch": 1.4238162212845757, "grad_norm": 0.1512518290372575, "learning_rate": 2.843032130264289e-05, "loss": 0.0254, "step": 380},
    {"epoch": 1.4613220815752461, "grad_norm": 0.4256415803778755, "learning_rate": 2.7425246321366203e-05, "loss": 0.0289, "step": 390},
    {"epoch": 1.4988279418659165, "grad_norm": 2.0526292381935587, "learning_rate": 2.6416196928509408e-05, "loss": 0.0293, "step": 400},
    {"epoch": 1.5363338021565869, "grad_norm": 2.199901935419105, "learning_rate": 2.540482672006254e-05, "loss": 0.0324, "step": 410},
    {"epoch": 1.5738396624472575, "grad_norm": 0.6587554924832156, "learning_rate": 2.4392793095289677e-05, "loss": 0.0318, "step": 420},
    {"epoch": 1.6113455227379276, "grad_norm": 0.11953774619854174, "learning_rate": 2.338175454063911e-05, "loss": 0.027, "step": 430},
    {"epoch": 1.6488513830285982, "grad_norm": 1.8366328720607281, "learning_rate": 2.2373367911871904e-05, "loss": 0.0271, "step": 440},
    {"epoch": 1.6863572433192686, "grad_norm": 0.16134023570988165, "learning_rate": 2.136928571886275e-05, "loss": 0.0309, "step": 450},
    {"epoch": 1.723863103609939, "grad_norm": 0.5782347760396018, "learning_rate": 2.03711534175227e-05, "loss": 0.0276, "step": 460},
    {"epoch": 1.7613689639006096, "grad_norm": 0.7600638604790938, "learning_rate": 1.9380606713281775e-05, "loss": 0.0284, "step": 470},
    {"epoch": 1.7988748241912798, "grad_norm": 0.28905055512217726, "learning_rate": 1.8399268880550174e-05, "loss": 0.0289, "step": 480},
    {"epoch": 1.8363806844819504, "grad_norm": 0.47269674339106393, "learning_rate": 1.7428748102551237e-05, "loss": 0.0254, "step": 490},
    {"epoch": 1.8738865447726207, "grad_norm": 0.1126048083243114, "learning_rate": 1.6470634835885097e-05, "loss": 0.0329, "step": 500},
    {"epoch": 1.9113924050632911, "grad_norm": 0.4869034202302143, "learning_rate": 1.552649920414233e-05, "loss": 0.0294, "step": 510},
    {"epoch": 1.9488982653539617, "grad_norm": 0.1048044631528693, "learning_rate": 1.4597888424838518e-05, "loss": 0.03, "step": 520},
    {"epoch": 1.9864041256446319, "grad_norm": 0.257084202132171, "learning_rate": 1.368632427388653e-05, "loss": 0.0263, "step": 530},
    {"epoch": 2.0225035161744023, "grad_norm": 0.41612935348774654, "learning_rate": 1.2793300591761742e-05, "loss": 0.0255, "step": 540},
    {"epoch": 2.060009376465073, "grad_norm": 0.1472784892712205, "learning_rate": 1.1920280835446748e-05, "loss": 0.019, "step": 550},
    {"epoch": 2.097515236755743, "grad_norm": 0.7021607086288816, "learning_rate": 1.1068695680167664e-05, "loss": 0.0259, "step": 560},
    {"epoch": 2.1350210970464136, "grad_norm": 1.0121270104703033, "learning_rate": 1.0239940674851941e-05, "loss": 0.0228, "step": 570},
    {"epoch": 2.172526957337084, "grad_norm": 0.8364824257153406, "learning_rate": 9.43537395515003e-06, "loss": 0.0233, "step": 580},
    {"epoch": 2.2100328176277544, "grad_norm": 0.29831710959245356, "learning_rate": 8.656314017768693e-06, "loss": 0.0213, "step": 590},
    {"epoch": 2.247538677918425, "grad_norm": 0.21598369420228658, "learning_rate": 7.904037559763162e-06, "loss": 0.0228, "step": 600},
    {"epoch": 2.285044538209095, "grad_norm": 0.5662760774283471, "learning_rate": 7.179777386329276e-06, "loss": 0.0184, "step": 610},
    {"epoch": 2.3225503984997657, "grad_norm": 0.10841392927498035, "learning_rate": 6.484720390524007e-06, "loss": 0.0223, "step": 620},
    {"epoch": 2.360056258790436, "grad_norm": 0.2351999089031456, "learning_rate": 5.820005608225346e-06, "loss": 0.0221, "step": 630},
    {"epoch": 2.3975621190811065, "grad_norm": 0.27088765350399413, "learning_rate": 5.186722351518822e-06, "loss": 0.0276, "step": 640},
    {"epoch": 2.4350679793717767, "grad_norm": 0.08323548651396794, "learning_rate": 4.585908423569724e-06, "loss": 0.0209, "step": 650},
    {"epoch": 2.4725738396624473, "grad_norm": 0.21245905268041415, "learning_rate": 4.0185484179064425e-06, "loss": 0.0233, "step": 660},
    {"epoch": 2.510079699953118, "grad_norm": 0.5537577775149638, "learning_rate": 3.4855721049018688e-06, "loss": 0.0229, "step": 670},
    {"epoch": 2.547585560243788, "grad_norm": 0.7847967042002256, "learning_rate": 2.98785290809723e-06, "loss": 0.0253, "step": 680},
    {"epoch": 2.5850914205344586, "grad_norm": 0.507105447694394, "learning_rate": 2.52620647286512e-06, "loss": 0.0206, "step": 690},
    {"epoch": 2.6225972808251288, "grad_norm": 0.24719979538798334, "learning_rate": 2.101389329757478e-06, "loss": 0.0172, "step": 700},
    {"epoch": 2.6601031411157994, "grad_norm": 0.481232043094042, "learning_rate": 1.7140976547289438e-06, "loss": 0.0197, "step": 710},
    {"epoch": 2.6976090014064695, "grad_norm": 0.525987532669796, "learning_rate": 1.3649661282672476e-06, "loss": 0.0202, "step": 720},
    {"epoch": 2.73511486169714, "grad_norm": 0.12411824566724937, "learning_rate": 1.0545668953003241e-06, "loss": 0.0215, "step": 730},
    {"epoch": 2.7726207219878107, "grad_norm": 0.2216514712018457, "learning_rate": 7.834086275845587e-07, "loss": 0.0182, "step": 740},
    {"epoch": 2.810126582278481, "grad_norm": 0.220985617144204, "learning_rate": 5.519356901107358e-07, "loss": 0.0244, "step": 750},
    {"epoch": 2.8476324425691515, "grad_norm": 0.34207273950972444, "learning_rate": 3.605274128937464e-07, "loss": 0.0233, "step": 760},
    {"epoch": 2.885138302859822, "grad_norm": 0.11697799335786845, "learning_rate": 2.094974693393731e-07, "loss": 0.019, "step": 770},
    {"epoch": 2.9226441631504922, "grad_norm": 0.3157831029546487, "learning_rate": 9.90933622069562e-08, "loss": 0.0177, "step": 780},
    {"epoch": 2.960150023441163, "grad_norm": 0.16740144227166562, "learning_rate": 2.9496018010233274e-08, "loss": 0.022, "step": 790},
    {"epoch": 2.997655883731833, "grad_norm": 0.33884453903018824, "learning_rate": 8.194905210923143e-10, "loss": 0.0232, "step": 800},
    {"epoch": 3.0, "step": 801, "total_flos": 33113178439680.0, "train_loss": 0.042386234274015444, "train_runtime": 4174.8779, "train_samples_per_second": 24.521, "train_steps_per_second": 0.192}
  ],
  "logging_steps": 10,
  "max_steps": 801,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 3,
  "save_steps": 100,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": true
      },
      "attributes": {}
    }
  },
  "total_flos": 33113178439680.0,
  "train_batch_size": 4,
  "trial_name": null,
  "trial_params": null
}
training_loss.png
ADDED
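training_loss.png renders the loss column of the log_history above. A minimal sketch of how the same curve can be reproduced from trainer_state.json (assumes matplotlib is available and the file path is relative to the output directory):

# Re-plot the training loss curve from trainer_state.json's log_history.
import json
import matplotlib.pyplot as plt

with open("trainer_state.json") as f:
    state = json.load(f)

# Keep only the periodic logging entries; the final summary entry has no "loss" key.
logs = [e for e in state["log_history"] if "loss" in e]
steps = [e["step"] for e in logs]
losses = [e["loss"] for e in logs]

plt.plot(steps, losses)
plt.xlabel("step")
plt.ylabel("training loss")
plt.title("Qwen3-4B-Instruct_0910_LODO_gitlab_full")
plt.savefig("training_loss.png")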