nroggendorff committed on
Commit
aa4a704
·
verified ·
1 Parent(s): 3027af9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -3
app.py CHANGED
@@ -9,7 +9,7 @@ import requests as rq
9
  import gc
10
  from tokenizers import ByteLevelBPETokenizer
11
 
12
- dataset = load_dataset("nroggendorff/openhermes", split="train").select(range(int(5e+4)))
13
 
14
  def get_training_corpus():
15
  for i in range(0, len(dataset), 1000):
@@ -104,8 +104,7 @@ args = TrainingArguments(
104
  save_steps=100000,
105
  fp16=True,
106
  optim="sgd",
107
- optim_target_modules=["attn", "mlp"],
108
- max_grad_norm=0.3
109
  )
110
 
111
  trainer = trl.SFTTrainer(
 
9
  import gc
10
  from tokenizers import ByteLevelBPETokenizer
11
 
12
+ dataset = load_dataset("nroggendorff/openhermes", split="train")#.select(range(int(5e+4)))
13
 
14
  def get_training_corpus():
15
  for i in range(0, len(dataset), 1000):
 
104
  save_steps=100000,
105
  fp16=True,
106
  optim="sgd",
107
+ optim_target_modules=["attn", "mlp"]
 
108
  )
109
 
110
  trainer = trl.SFTTrainer(