prosecalign
/

phi3m0128-wds-0.9-kendall-onof-ofif-corr-max-2-simpo-max1500-default

Transformers

Safetensors

Generated from Trainer

llama-factory

Model card Files Files and versions Community

ziansu commited on Jan 31

Commit

5e704c7

verified ·

1 Parent(s): 0f2f4cd

Training in progress, step 1350

Browse files

Files changed (2) hide show

adapter_model.safetensors +1 -1
trainer_log.jsonl +6 -0

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6742ad596b004d6eb1f1542280e5955260247e1c2fba2da5c8cd6199fad48ffa
 size 25200088

 version https://git-lfs.github.com/spec/v1
+oid sha256:b593941f34d1b2a8e6b529cd2ffa7fdffdb5210951b4bd66051c21793f2fc75f
 size 25200088

trainer_log.jsonl CHANGED Viewed

@@ -154,3 +154,9 @@
 {"current_steps": 1290, "total_steps": 1500, "loss": 0.2191, "accuracy": 0.9624999761581421, "learning_rate": 2.3793236883495164e-07, "epoch": 1.0419778002018163, "percentage": 86.0, "elapsed_time": "3:01:26", "remaining_time": "0:29:32", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "loss": 0.1877, "accuracy": 0.925000011920929, "learning_rate": 2.1613635589349756e-07, "epoch": 1.050050454086781, "percentage": 86.67, "elapsed_time": "3:02:45", "remaining_time": "0:28:06", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "eval_loss": 0.2025279700756073, "epoch": 1.050050454086781, "percentage": 86.67, "elapsed_time": "3:03:15", "remaining_time": "0:28:11", "throughput": "0.00", "total_tokens": 0}

 {"current_steps": 1290, "total_steps": 1500, "loss": 0.2191, "accuracy": 0.9624999761581421, "learning_rate": 2.3793236883495164e-07, "epoch": 1.0419778002018163, "percentage": 86.0, "elapsed_time": "3:01:26", "remaining_time": "0:29:32", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "loss": 0.1877, "accuracy": 0.925000011920929, "learning_rate": 2.1613635589349756e-07, "epoch": 1.050050454086781, "percentage": 86.67, "elapsed_time": "3:02:45", "remaining_time": "0:28:06", "throughput": "0.00", "total_tokens": 0}
 {"current_steps": 1300, "total_steps": 1500, "eval_loss": 0.2025279700756073, "epoch": 1.050050454086781, "percentage": 86.67, "elapsed_time": "3:03:15", "remaining_time": "0:28:11", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1310, "total_steps": 1500, "loss": 0.2232, "accuracy": 0.9624999761581421, "learning_rate": 1.95342121028749e-07, "epoch": 1.0581231079717457, "percentage": 87.33, "elapsed_time": "3:04:38", "remaining_time": "0:26:46", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1320, "total_steps": 1500, "loss": 0.1756, "accuracy": 0.9375, "learning_rate": 1.7555878527937164e-07, "epoch": 1.0661957618567104, "percentage": 88.0, "elapsed_time": "3:05:56", "remaining_time": "0:25:21", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1330, "total_steps": 1500, "loss": 0.1806, "accuracy": 0.949999988079071, "learning_rate": 1.567950262702714e-07, "epoch": 1.074268415741675, "percentage": 88.67, "elapsed_time": "3:07:16", "remaining_time": "0:23:56", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1340, "total_steps": 1500, "loss": 0.1918, "accuracy": 0.9624999761581421, "learning_rate": 1.3905907440629752e-07, "epoch": 1.0823410696266398, "percentage": 89.33, "elapsed_time": "3:08:34", "remaining_time": "0:22:30", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1350, "total_steps": 1500, "loss": 0.1845, "accuracy": 0.949999988079071, "learning_rate": 1.223587092621162e-07, "epoch": 1.0904137235116045, "percentage": 90.0, "elapsed_time": "3:09:50", "remaining_time": "0:21:05", "throughput": "0.00", "total_tokens": 0}
+{"current_steps": 1350, "total_steps": 1500, "eval_loss": 0.20255495607852936, "epoch": 1.0904137235116045, "percentage": 90.0, "elapsed_time": "3:10:20", "remaining_time": "0:21:08", "throughput": "0.00", "total_tokens": 0}