{
  "name": "MTA-DeepCode-r32-a32-epoch20",
  "base_model": "Qwen/Qwen2.5-Coder-3B-Instruct",
  "context_length": 8192,
  "model_type": "finetuned",
  "finetune_steps": [
    {
      "base_model": "Qwen/Qwen2.5-Coder-3B-Instruct",
      "step": 1,
      "data": "MTA-project",
      "epochs": 20,
      "batch_size": 16,
      "dataset_size": 5420,
      "num_tests": ""
    }
  ],
  "project": "MTA",
  "prompt_template": {
    "user_tag": "<|start_header_id|>user<|end_header_id|>",
    "end_tag": "<|eot_id|>",
    "assistant_tag": "<|start_header_id|>assistant<|end_header_id|>"
  }
}