Spaces: Runtime error
Commit: Update app.py
File changed: app.py
@@ -10,7 +10,7 @@ from datasets import load_dataset
|
|
10 |
from tokenizers import ByteLevelBPETokenizer
|
11 |
import trl
|
12 |
|
13 |
-
dataset = load_dataset("nroggendorff/openhermes", split="train")
|
14 |
|
15 |
def get_training_corpus():
|
16 |
for i in range(0, len(dataset), 1000):
|
@@ -99,8 +99,7 @@ print(dataset['text'][2])
|
|
99 |
args = TrainingArguments(
|
100 |
output_dir="mayo",
|
101 |
num_train_epochs=2,
|
102 |
-
|
103 |
-
per_device_train_batch_size=32,
|
104 |
learning_rate=1e-5,
|
105 |
save_steps=100000,
|
106 |
fp16=True,
|
|
|
10 |
from tokenizers import ByteLevelBPETokenizer
|
11 |
import trl
|
12 |
|
13 |
+
dataset = load_dataset("nroggendorff/openhermes", split="train").select(range(int(4e+5)))
|
14 |
|
15 |
def get_training_corpus():
|
16 |
for i in range(0, len(dataset), 1000):
|
|
|
99 |
args = TrainingArguments(
|
100 |
output_dir="mayo",
|
101 |
num_train_epochs=2,
|
102 |
+
per_device_train_batch_size=64,
|
|
|
103 |
learning_rate=1e-5,
|
104 |
save_steps=100000,
|
105 |
fp16=True,
|