{
  "training_completed": true,
  "distillation_method": "knowledge_distillation",
  "teacher_model": "Qwen/Qwen2.5-Coder-7B-Instruct-AWQ",
  "student_model": "Qwen/Qwen2.5-Coder-3B-Instruct-AWQ",
  "best_validation_loss": 1.9286,
  "optimal_temperature": 2.0,
  "optimal_alpha": 0.95,
  "training_samples": 118,
  "validation_samples": 23,
  "test_samples": 100
}