FatCat87 committed on
Commit
11c42d6
·
verified ·
1 Parent(s): 1372ca6

Training in progress, step 6

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:855d3ef8e703db5cbd18b22f1654123853cbc6a09f21ce4a327eadbe313de010
3
  size 159967880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c0a943fca0e94e7e8006736d302cdaca949111c938556cbcc4729707a0ffeaf
3
  size 159967880
config.json CHANGED
@@ -14,7 +14,7 @@
14
  "initializer_range": 0.02,
15
  "intermediate_size": 11008,
16
  "max_length": 4096,
17
- "max_position_embeddings": 2048,
18
  "mlp_bias": false,
19
  "model_type": "llama",
20
  "num_attention_heads": 32,
@@ -27,7 +27,7 @@
27
  "rope_theta": 10000.0,
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "float16",
30
- "transformers_version": "4.48.1",
31
  "use_cache": false,
32
  "vocab_size": 46336
33
  }
 
14
  "initializer_range": 0.02,
15
  "intermediate_size": 11008,
16
  "max_length": 4096,
17
+ "max_position_embeddings": 4096,
18
  "mlp_bias": false,
19
  "model_type": "llama",
20
  "num_attention_heads": 32,
 
27
  "rope_theta": 10000.0,
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "float16",
30
+ "transformers_version": "4.46.3",
31
  "use_cache": false,
32
  "vocab_size": 46336
33
  }
tokenizer_config.json CHANGED
@@ -71,7 +71,6 @@
71
  "bos_token": "<s>",
72
  "clean_up_tokenization_spaces": false,
73
  "eos_token": "</s>",
74
- "extra_special_tokens": {},
75
  "legacy": false,
76
  "model_max_length": 1000000000000000019884624838656,
77
  "pad_token": "</s>",
 
71
  "bos_token": "<s>",
72
  "clean_up_tokenization_spaces": false,
73
  "eos_token": "</s>",
 
74
  "legacy": false,
75
  "model_max_length": 1000000000000000019884624838656,
76
  "pad_token": "</s>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4f0529a4ec5700e384743cbdf1b663399ea3e9152f91ce196042e0be4e12915
3
- size 6520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8f72a47124e638e8e41619a2dae021e86edc0680b71921e6223382dd20d1c72
3
+ size 6392