---
# Training configuration for an extractive question-answering run.
#
# Stray table-border pipes ("|") left over from a copy/paste were removed
# and the nesting under data / params / hub was restored, so the file loads
# as a mapping instead of one literal string.

task: extractive-qa
# NOTE(review): this value has the form of an OpenAI fine-tuned model ID,
# not a Hugging Face Hub repo or a local path -- confirm the trainer for
# this task can actually load it. Quoted because it contains colons.
base_model: 'ft:gpt-4o-2024-08-06:raiffs-bits:codettev7:B7vPpFBj'
# NOTE(review): looks like a generated project ID; confirm it is the
# intended name for this run.
project_name: proj_qBLEJleU9G2KjNQCBvemjfRh
log: tensorboard
backend: local

# Dataset location and the names of the splits to use.
data:
  path: data/
  train_split: train
  valid_split: valid
  # Dataset column names for the context text, the question and the
  # answers (presumably role -> column; verify against the dataset).
  column_mapping:
    text_column: context
    question_column: question
    answer_column: answers

# Training hyperparameters.
params:
  max_seq_length: 512
  max_doc_stride: 128
  epochs: 3
  batch_size: 4
  # Written with a decimal point on purpose: YAML 1.1 loaders such as
  # PyYAML resolve a bare `2e-5` as a string, not a float.
  lr: 2.0e-5
  optimizer: adamw_torch
  scheduler: linear
  gradient_accumulation: 1
  mixed_precision: fp16

# Hub publishing settings. The ${...} values are placeholders (presumably
# expanded from environment variables by the consumer -- confirm); never
# commit real credentials here. Quoted so they always load as strings.
hub:
  username: '${HF_USERNAME}'
  token: '${HF_TOKEN}'
  push_to_hub: true