qwen-coder-1.5B-Instruct-AWQ-t2 / checkpoints_summary.json
Vinitha2004's picture
Upload distilled Qwen2.5-Coder-3B model with knowledge distillation
6eaddc2 verified
{
"total_checkpoints": 3,
"best_checkpoint": {
"epoch": 2,
"path": "./models/working_draft/checkpoint_epoch_2",
"val_loss": 1.9706446496658447,
"train_loss": 1.9690602091820009,
"is_best": true
},
"checkpoints": [
{
"epoch": 0,
"path": "./models/working_draft/checkpoint_epoch_0",
"val_loss": 1.9706641339331337,
"train_loss": 1.9690746277378453,
"is_best": false
},
{
"epoch": 1,
"path": "./models/working_draft/checkpoint_epoch_1",
"val_loss": 1.9706711761400657,
"train_loss": 1.9690665218522472,
"is_best": false
},
{
"epoch": 2,
"path": "./models/working_draft/checkpoint_epoch_2",
"val_loss": 1.9706446496658447,
"train_loss": 1.9690602091820009,
"is_best": true
}
],
"training_time_minutes": 90.36421235005061,
"summary_created": "2025-06-13 12:39:51"
}