File size: 364 Bytes
88eee7d |
1 2 3 4 5 6 7 8 9 10 11 12 |
{
"training_completed": true,
"distillation_method": "knowledge_distillation",
"teacher_model": "Qwen/Qwen2.5-Coder-7B-Instruct-AWQ",
"student_model": "Qwen/Qwen2.5-Coder-3B-Instruct-AWQ",
"best_validation_loss": 1.9286,
"optimal_temperature": 2.0,
"optimal_alpha": 0.95,
"training_samples": 118,
"validation_samples": 23,
"test_samples": 100
} |