File size: 364 Bytes
88eee7d
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
{
  "training_completed": true,
  "distillation_method": "knowledge_distillation",
  "teacher_model": "Qwen/Qwen2.5-Coder-7B-Instruct-AWQ",
  "student_model": "Qwen/Qwen2.5-Coder-3B-Instruct-AWQ",
  "best_validation_loss": 1.9286,
  "optimal_temperature": 2.0,
  "optimal_alpha": 0.95,
  "training_samples": 118,
  "validation_samples": 23,
  "test_samples": 100
}