Spaces:

nroggendorff
/

train-llama

Runtime error

nroggendorff committed on Aug 5, 2024

Commit

b1e38e3

verified ·

1 Parent(s): e001176

Update train.py

Files changed (1) hide show

train.py CHANGED Viewed

@@ -8,11 +8,11 @@ from datasets import load_dataset, DatasetDict, Dataset
 from tokenizers import ByteLevelBPETokenizer
 MAX_SEQ_LENGTH = 128
-BATCH_SIZE = 64
 EPOCHS = 2
-LEARNING_RATE = 1e-4
 FACTOR = 1024
-VOCAB_SIZE = 3200
 INPUT_DATASET = "HuggingFaceTB/smollm-corpus"
 INSTRUCT_DATASET = "nroggendorff/openhermes"
 OUTPUT_REPO = "smallama"

 from tokenizers import ByteLevelBPETokenizer
 MAX_SEQ_LENGTH = 128
+BATCH_SIZE = 16
 EPOCHS = 2
+LEARNING_RATE = 1e-3
 FACTOR = 1024
+VOCAB_SIZE = 32000
 INPUT_DATASET = "HuggingFaceTB/smollm-corpus"
 INSTRUCT_DATASET = "nroggendorff/openhermes"
 OUTPUT_REPO = "smallama"