Vinitha2004's picture
Upload distilled Qwen2.5-Coder-3B model with knowledge distillation
eee74b7 verified
{
"total_checkpoints": 3,
"best_checkpoint": {
"epoch": 2,
"path": "./models/working_draft/checkpoint_epoch_2",
"val_loss": 1.6648176369258776,
"train_loss": 1.6754711744398976,
"is_best": true
},
"checkpoints": [
{
"epoch": 0,
"path": "./models/working_draft/checkpoint_epoch_0",
"val_loss": 1.6648216817606247,
"train_loss": 1.6754714963588506,
"is_best": false
},
{
"epoch": 1,
"path": "./models/working_draft/checkpoint_epoch_1",
"val_loss": 1.6648264206669057,
"train_loss": 1.6754815220601948,
"is_best": false
},
{
"epoch": 2,
"path": "./models/working_draft/checkpoint_epoch_2",
"val_loss": 1.6648176369258776,
"train_loss": 1.6754711744398976,
"is_best": true
}
],
"training_time_minutes": 100.0129363934199,
"summary_created": "2025-06-13 19:03:52"
}