Update README.md
Browse files
README.md
CHANGED
|
@@ -14,15 +14,25 @@ tags: []
|
|
| 14 |
### Model Description
|
| 15 |
|
| 16 |
MaxLen: 1500
|
|
|
|
| 17 |
Dataset: final_dataset_2.json
|
|
|
|
| 18 |
batch_size: 4
|
|
|
|
| 19 |
num_epochs: 4 (eq. 2)
|
|
|
|
| 20 |
checkpoint: 180
|
|
|
|
| 21 |
LoRA r = 384
|
|
|
|
| 22 |
target_modules = [
|
|
|
|
| 23 |
"query_proj", "key_proj", "value_proj", "dense",
|
|
|
|
| 24 |
"linear_1", "linear_2",
|
|
|
|
| 25 |
"mlp.0", "mlp.2", "mlp.4"
|
|
|
|
| 26 |
]
|
| 27 |
|
| 28 |
|
|
|
|
| 14 |
### Model Description
|
| 15 |
|
| 16 |
MaxLen: 1500
|
| 17 |
+
|
| 18 |
Dataset: final_dataset_2.json
|
| 19 |
+
|
| 20 |
batch_size: 4
|
| 21 |
+
|
| 22 |
num_epochs: 4 (eq. 2)
|
| 23 |
+
|
| 24 |
checkpoint: 180
|
| 25 |
+
|
| 26 |
LoRA r = 384
|
| 27 |
+
|
| 28 |
target_modules = [
|
| 29 |
+
|
| 30 |
"query_proj", "key_proj", "value_proj", "dense",
|
| 31 |
+
|
| 32 |
"linear_1", "linear_2",
|
| 33 |
+
|
| 34 |
"mlp.0", "mlp.2", "mlp.4"
|
| 35 |
+
|
| 36 |
]
|
| 37 |
|
| 38 |
|