Vinitha2004's picture
Upload distilled Qwen2.5-Coder-3B model with knowledge distillation
eee74b7 verified
{
  "model_type": "validated_distilled_draft",
  "frontier_model": "Qwen/Qwen2.5-Coder-7B-Instruct-AWQ",
  "draft_model": "Qwen/Qwen2.5-Coder-3B-Instruct-AWQ",
  "training_time_minutes": 100.0129363934199,
  "best_val_loss": 1.6648176369258776,
  "best_epoch": 3,
  "final_temperature": 2.0,
  "final_alpha": 0.95,
  "epochs_completed": 3,
  "early_stopped": false,
  "total_checkpoints_saved": 3,
  "save_all_checkpoints": true,
  "save_validation_info": true,
  "completion_time": "2025-06-13 19:03:53",
  "checkpoint_paths": [
    "./models/working_draft/checkpoint_epoch_0",
    "./models/working_draft/checkpoint_epoch_1",
    "./models/working_draft/checkpoint_epoch_2"
  ],
  "best_checkpoint_epoch": 3
}