Rakancorle1 commited on
Commit
51bca50
·
verified ·
1 Parent(s): ba427e6

Training in progress, step 800

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c9a9798094b1b959caf4bf48828f2f69b9577171c1bffe168e778eec1ca991a
3
  size 4967215360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7abe8a8aa4bd4c0faeeb497d12527c03cfc2487a3917df810589eeb1c3d163c4
3
  size 4967215360
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b26cb5105a55b060be420f2dab44a9d7dda283bf60816caf3d61c6a41fb84ce
3
  size 3077766632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a391bbca2479fd3cd0d25ecbd2711eca1239b2105547d173c0601b1a56402aca
3
  size 3077766632
trainer_log.jsonl CHANGED
@@ -68,3 +68,13 @@
68
  {"current_steps": 680, "total_steps": 801, "loss": 0.0253, "lr": 2.98785290809723e-06, "epoch": 2.547585560243788, "percentage": 84.89, "elapsed_time": "0:57:29", "remaining_time": "0:10:13"}
69
  {"current_steps": 690, "total_steps": 801, "loss": 0.0206, "lr": 2.52620647286512e-06, "epoch": 2.5850914205344586, "percentage": 86.14, "elapsed_time": "0:58:16", "remaining_time": "0:09:22"}
70
  {"current_steps": 700, "total_steps": 801, "loss": 0.0172, "lr": 2.101389329757478e-06, "epoch": 2.6225972808251288, "percentage": 87.39, "elapsed_time": "0:59:03", "remaining_time": "0:08:31"}
 
 
 
 
 
 
 
 
 
 
 
68
  {"current_steps": 680, "total_steps": 801, "loss": 0.0253, "lr": 2.98785290809723e-06, "epoch": 2.547585560243788, "percentage": 84.89, "elapsed_time": "0:57:29", "remaining_time": "0:10:13"}
69
  {"current_steps": 690, "total_steps": 801, "loss": 0.0206, "lr": 2.52620647286512e-06, "epoch": 2.5850914205344586, "percentage": 86.14, "elapsed_time": "0:58:16", "remaining_time": "0:09:22"}
70
  {"current_steps": 700, "total_steps": 801, "loss": 0.0172, "lr": 2.101389329757478e-06, "epoch": 2.6225972808251288, "percentage": 87.39, "elapsed_time": "0:59:03", "remaining_time": "0:08:31"}
71
+ {"current_steps": 710, "total_steps": 801, "loss": 0.0197, "lr": 1.7140976547289438e-06, "epoch": 2.6601031411157994, "percentage": 88.64, "elapsed_time": "1:00:39", "remaining_time": "0:07:46"}
72
+ {"current_steps": 720, "total_steps": 801, "loss": 0.0202, "lr": 1.3649661282672476e-06, "epoch": 2.6976090014064695, "percentage": 89.89, "elapsed_time": "1:01:26", "remaining_time": "0:06:54"}
73
+ {"current_steps": 730, "total_steps": 801, "loss": 0.0215, "lr": 1.0545668953003241e-06, "epoch": 2.73511486169714, "percentage": 91.14, "elapsed_time": "1:02:14", "remaining_time": "0:06:03"}
74
+ {"current_steps": 740, "total_steps": 801, "loss": 0.0182, "lr": 7.834086275845587e-07, "epoch": 2.7726207219878107, "percentage": 92.38, "elapsed_time": "1:03:01", "remaining_time": "0:05:11"}
75
+ {"current_steps": 750, "total_steps": 801, "loss": 0.0244, "lr": 5.519356901107358e-07, "epoch": 2.810126582278481, "percentage": 93.63, "elapsed_time": "1:03:48", "remaining_time": "0:04:20"}
76
+ {"current_steps": 760, "total_steps": 801, "loss": 0.0233, "lr": 3.605274128937464e-07, "epoch": 2.8476324425691515, "percentage": 94.88, "elapsed_time": "1:04:35", "remaining_time": "0:03:29"}
77
+ {"current_steps": 770, "total_steps": 801, "loss": 0.019, "lr": 2.094974693393731e-07, "epoch": 2.885138302859822, "percentage": 96.13, "elapsed_time": "1:05:23", "remaining_time": "0:02:37"}
78
+ {"current_steps": 780, "total_steps": 801, "loss": 0.0177, "lr": 9.90933622069562e-08, "epoch": 2.9226441631504922, "percentage": 97.38, "elapsed_time": "1:06:10", "remaining_time": "0:01:46"}
79
+ {"current_steps": 790, "total_steps": 801, "loss": 0.022, "lr": 2.9496018010233274e-08, "epoch": 2.960150023441163, "percentage": 98.63, "elapsed_time": "1:06:57", "remaining_time": "0:00:55"}
80
+ {"current_steps": 800, "total_steps": 801, "loss": 0.0232, "lr": 8.194905210923143e-10, "epoch": 2.997655883731833, "percentage": 99.88, "elapsed_time": "1:07:44", "remaining_time": "0:00:05"}