{
  "base_model": "microsoft/Phi-3-mini-4k-instruct",
  "domains": [
    "ambiguous",
    "api_generation",
    "business",
    "coding",
    "creative_content",
    "data_analysis",
    "education",
    "general_knowledge",
    "geography",
    "history",
    "law",
    "literature",
    "mathematics",
    "medicine",
    "science",
    "sensitive",
    "technology"
  ],
  "num_domains": 17,
  "training_samples": 3666,
  "multi_domain_samples": 516,
  "training_config": {
    "num_epochs": 5,
    "batch_size": 16,
    "learning_rate": 0.0002,
    "warmup_ratio": 0.1,
    "weight_decay": 0.01,
    "gradient_accumulation_steps": 2,
    "eval_steps": 50,
    "save_steps": 100,
    "logging_steps": 10
  },
  "lora_config": {
    "r": 32,
    "lora_alpha": 64,
    "lora_dropout": 0.1,
    "target_modules": [
      "qkv_proj",
      "o_proj",
      "gate_up_proj",
      "down_proj"
    ]
  },
  "training_time_hours": 1.6138046666666666,
  "final_loss": 0.14003139210783916
}