nroggendorff committed on
Commit
fde7da2
·
verified ·
1 Parent(s): 42c3bab

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -3
app.py CHANGED
@@ -10,7 +10,7 @@ from datasets import load_dataset
10
  from tokenizers import ByteLevelBPETokenizer
11
  import trl
12
 
13
- dataset = load_dataset("nroggendorff/openhermes", split="train")#.select(range(int(4e+5)))
14
 
15
  def get_training_corpus():
16
  for i in range(0, len(dataset), 1000):
@@ -99,8 +99,7 @@ print(dataset['text'][2])
99
  args = TrainingArguments(
100
  output_dir="mayo",
101
  num_train_epochs=2,
102
- gradient_accumulation_steps=16,
103
- per_device_train_batch_size=32,
104
  learning_rate=1e-5,
105
  save_steps=100000,
106
  fp16=True,
 
10
  from tokenizers import ByteLevelBPETokenizer
11
  import trl
12
 
13
+ dataset = load_dataset("nroggendorff/openhermes", split="train").select(range(int(4e+5)))
14
 
15
  def get_training_corpus():
16
  for i in range(0, len(dataset), 1000):
 
99
  args = TrainingArguments(
100
  output_dir="mayo",
101
  num_train_epochs=2,
102
+ per_device_train_batch_size=64,
 
103
  learning_rate=1e-5,
104
  save_steps=100000,
105
  fp16=True,