{
  "model_config": {
    "architectures": ["PhiForSequenceClassification"],
    "model_type": "phi",
    "name": "Waggerra/classifier",
    "base_model": "microsoft/phi-3",
    "fine_tuned": true
  },
  "inference_config": {
    "temperature": 0.7,
    "top_p": 0.9,
    "max_length": 2048,
    "do_sample": true
  },
  "training_config": {
    "learning_rate": 2e-5,
    "num_train_epochs": 3,
    "per_device_train_batch_size": 4,
    "gradient_accumulation_steps": 4
  },
  "metadata": {
    "author": "Waggerra",
    "model_name": "classifier",
    "description": "Phi-3 3B model fine-tuned for classification tasks",
    "tags": ["classification", "phi-3", "fine-tuned"],
    "license": "mit",
    "language": ["en"]
  }
}