izzcw committed on
Commit
d98c4c1
·
verified ·
1 Parent(s): e7253db

Training in progress, step 93

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ec42485aab39aeaec2ad62ad2d2f95a40fa574ed1ad787c6806857a77b30199a
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a74d92a6b91f054e3ba3813556e05c2ec5b7647a11b045bdbb4dffd1641b4b32
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:efb6c3416a76f07024ba9849f70e65c0191f98b4e296b8ab8914ac207044293f
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cc1535e9cbaa0e251a238cd4abb4edb363b70bb78e1434339ce336508df6b4a
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e4def9d45efd474e4701b75187912d2891b8326d3d0096491ef9b1dbb5e6eea
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de9d01fb65ea3c10b8d43dc1acb87db03c0429751182a34e42c27111b6eb3e56
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25f189ac139cf9f97897763f55cb92195b6e3ae5ef10215e33212b147d86966f
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9314e462f0427901d8df8087490dadb92db749662871e91c02db309ee8237ded
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -1,4 +1,11 @@
1
- {"current_steps": 10, "total_steps": 31, "loss": 0.7064, "lr": 8.83022221559489e-06, "epoch": 0.321285140562249, "percentage": 32.26, "elapsed_time": "0:02:32", "remaining_time": "0:05:19"}
2
- {"current_steps": 20, "total_steps": 31, "loss": 0.4659, "lr": 3.5659838364445505e-06, "epoch": 0.642570281124498, "percentage": 64.52, "elapsed_time": "0:05:02", "remaining_time": "0:02:46"}
3
- {"current_steps": 30, "total_steps": 31, "loss": 0.4287, "lr": 3.3808211290284886e-08, "epoch": 0.963855421686747, "percentage": 96.77, "elapsed_time": "0:07:28", "remaining_time": "0:00:14"}
4
- {"current_steps": 31, "total_steps": 31, "epoch": 0.9959839357429718, "percentage": 100.0, "elapsed_time": "0:08:41", "remaining_time": "0:00:00"}
 
 
 
 
 
 
 
 
1
+ {"current_steps": 10, "total_steps": 93, "loss": 0.7327, "lr": 1e-05, "epoch": 0.321285140562249, "percentage": 10.75, "elapsed_time": "0:02:32", "remaining_time": "0:21:09"}
2
+ {"current_steps": 20, "total_steps": 93, "loss": 0.4739, "lr": 9.646090361587828e-06, "epoch": 0.642570281124498, "percentage": 21.51, "elapsed_time": "0:05:03", "remaining_time": "0:18:29"}
3
+ {"current_steps": 30, "total_steps": 93, "loss": 0.4578, "lr": 8.634462259215719e-06, "epoch": 0.963855421686747, "percentage": 32.26, "elapsed_time": "0:07:30", "remaining_time": "0:15:45"}
4
+ {"current_steps": 40, "total_steps": 93, "loss": 0.3057, "lr": 7.10832566725092e-06, "epoch": 1.2570281124497993, "percentage": 43.01, "elapsed_time": "0:09:49", "remaining_time": "0:13:00"}
5
+ {"current_steps": 50, "total_steps": 93, "loss": 0.2544, "lr": 5.2837263654653715e-06, "epoch": 1.5783132530120483, "percentage": 53.76, "elapsed_time": "0:12:19", "remaining_time": "0:10:35"}
6
+ {"current_steps": 50, "total_steps": 93, "eval_loss": 0.3807889521121979, "epoch": 1.5783132530120483, "percentage": 53.76, "elapsed_time": "0:12:22", "remaining_time": "0:10:38"}
7
+ {"current_steps": 60, "total_steps": 93, "loss": 0.2408, "lr": 3.4189616655158803e-06, "epoch": 1.8995983935742973, "percentage": 64.52, "elapsed_time": "0:14:48", "remaining_time": "0:08:08"}
8
+ {"current_steps": 70, "total_steps": 93, "loss": 0.1671, "lr": 1.7780148476756148e-06, "epoch": 2.1927710843373496, "percentage": 75.27, "elapsed_time": "0:17:04", "remaining_time": "0:05:36"}
9
+ {"current_steps": 80, "total_steps": 93, "loss": 0.1015, "lr": 5.931846699267558e-07, "epoch": 2.5140562248995986, "percentage": 86.02, "elapsed_time": "0:19:32", "remaining_time": "0:03:10"}
10
+ {"current_steps": 90, "total_steps": 93, "loss": 0.0912, "lr": 3.220026018407541e-08, "epoch": 2.835341365461847, "percentage": 96.77, "elapsed_time": "0:22:00", "remaining_time": "0:00:44"}
11
+ {"current_steps": 93, "total_steps": 93, "epoch": 2.931726907630522, "percentage": 100.0, "elapsed_time": "0:23:41", "remaining_time": "0:00:00"}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6279e399ebb998f96e9b816afdafdba5e6cbe3c1188709ebbbae613fa676206c
3
  size 7544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aedb4d0adc657e20b6b4f80ac4bd9cf3383db799fe4c229251d750d6c5b80a04
3
  size 7544