Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90b65b63736bead58745658fe9df5201dfa918935ea409e502169de1deffbe4e
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6b73221df4e61b97f0b8d310a4a0864c7eb7f83627885f50dcd963c5a73d11b
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd9f35c366efec1be696765ea92b262425a0b41ae99d97497b326d96430008ef
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:997be707776442bbc04715472fbc827968063e78477a4060845a4f806cb1e597
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -6,3 +6,8 @@
|
|
6 |
{"current_steps": 60, "total_steps": 138, "loss": 0.8491, "lr": 6.971779275566593e-06, "epoch": 1.281081081081081, "percentage": 43.48, "elapsed_time": "0:06:35", "remaining_time": "0:08:34"}
|
7 |
{"current_steps": 70, "total_steps": 138, "loss": 0.8344, "lr": 5.757138887522884e-06, "epoch": 1.4972972972972973, "percentage": 50.72, "elapsed_time": "0:07:17", "remaining_time": "0:07:05"}
|
8 |
{"current_steps": 80, "total_steps": 138, "loss": 0.8397, "lr": 4.49415839006284e-06, "epoch": 1.7135135135135136, "percentage": 57.97, "elapsed_time": "0:08:00", "remaining_time": "0:05:48"}
|
|
|
|
|
|
|
|
|
|
|
|
6 |
{"current_steps": 60, "total_steps": 138, "loss": 0.8491, "lr": 6.971779275566593e-06, "epoch": 1.281081081081081, "percentage": 43.48, "elapsed_time": "0:06:35", "remaining_time": "0:08:34"}
|
7 |
{"current_steps": 70, "total_steps": 138, "loss": 0.8344, "lr": 5.757138887522884e-06, "epoch": 1.4972972972972973, "percentage": 50.72, "elapsed_time": "0:07:17", "remaining_time": "0:07:05"}
|
8 |
{"current_steps": 80, "total_steps": 138, "loss": 0.8397, "lr": 4.49415839006284e-06, "epoch": 1.7135135135135136, "percentage": 57.97, "elapsed_time": "0:08:00", "remaining_time": "0:05:48"}
|
9 |
+
{"current_steps": 90, "total_steps": 138, "loss": 0.8296, "lr": 3.2634737357758994e-06, "epoch": 1.9297297297297298, "percentage": 65.22, "elapsed_time": "0:08:41", "remaining_time": "0:04:38"}
|
10 |
+
{"current_steps": 100, "total_steps": 138, "loss": 0.7802, "lr": 2.1436589245260375e-06, "epoch": 2.1297297297297297, "percentage": 72.46, "elapsed_time": "0:12:09", "remaining_time": "0:04:37"}
|
11 |
+
{"current_steps": 110, "total_steps": 138, "loss": 0.7006, "lr": 1.2062093865360458e-06, "epoch": 2.345945945945946, "percentage": 79.71, "elapsed_time": "0:12:51", "remaining_time": "0:03:16"}
|
12 |
+
{"current_steps": 120, "total_steps": 138, "loss": 0.6986, "lr": 5.109773021462921e-07, "epoch": 2.562162162162162, "percentage": 86.96, "elapsed_time": "0:13:34", "remaining_time": "0:02:02"}
|
13 |
+
{"current_steps": 130, "total_steps": 138, "loss": 0.6844, "lr": 1.0235029373752758e-07, "epoch": 2.7783783783783784, "percentage": 94.2, "elapsed_time": "0:14:16", "remaining_time": "0:00:52"}
|