bilkultheek committed on
Commit
3b30e9b
·
verified ·
1 Parent(s): 887a611

Training in progress, step 100

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. README.md +75 -0
  2. adapter_config.json +29 -0
  3. adapter_model.safetensors +3 -0
  4. merges.txt +0 -0
  5. runs/Aug01_10-47-52_fastgpuserv/events.out.tfevents.1722491274.fastgpuserv.2113260.0 +3 -0
  6. runs/Aug01_10-51-09_fastgpuserv/events.out.tfevents.1722491470.fastgpuserv.2113260.1 +3 -0
  7. runs/Aug01_10-55-04_fastgpuserv/events.out.tfevents.1722491706.fastgpuserv.2113260.2 +3 -0
  8. runs/Aug01_11-01-02_fastgpuserv/events.out.tfevents.1722492064.fastgpuserv.2134733.0 +3 -0
  9. runs/Aug01_11-02-42_fastgpuserv/events.out.tfevents.1722492163.fastgpuserv.2134733.1 +3 -0
  10. runs/Aug01_14-05-55_fastgpuserv/events.out.tfevents.1722503158.fastgpuserv.6531.0 +3 -0
  11. runs/Aug01_14-08-57_fastgpuserv/events.out.tfevents.1722503340.fastgpuserv.7077.0 +3 -0
  12. runs/Aug02_12-33-35_fastgpuserv/events.out.tfevents.1722584019.fastgpuserv.3614347.0 +3 -0
  13. runs/Aug02_12-40-23_fastgpuserv/events.out.tfevents.1722584427.fastgpuserv.3637409.0 +3 -0
  14. runs/Aug02_12-42-43_fastgpuserv/events.out.tfevents.1722584567.fastgpuserv.3645427.0 +3 -0
  15. runs/Aug02_12-44-23_fastgpuserv/events.out.tfevents.1722584667.fastgpuserv.3650795.0 +3 -0
  16. runs/Aug02_12-45-52_fastgpuserv/events.out.tfevents.1722584756.fastgpuserv.3655138.0 +3 -0
  17. runs/Aug02_13-00-24_fastgpuserv/events.out.tfevents.1722585628.fastgpuserv.3689700.0 +3 -0
  18. runs/Aug02_13-04-57_fastgpuserv/events.out.tfevents.1722585901.fastgpuserv.3707066.0 +3 -0
  19. runs/Aug02_13-07-01_fastgpuserv/events.out.tfevents.1722586024.fastgpuserv.3714303.0 +3 -0
  20. runs/Aug02_13-07-01_fastgpuserv/events.out.tfevents.1722602007.fastgpuserv.3714303.1 +3 -0
  21. runs/Aug03_09-18-38_fastgpuserv/events.out.tfevents.1722658721.fastgpuserv.2914688.0 +3 -0
  22. runs/Aug03_09-18-38_fastgpuserv/events.out.tfevents.1722690531.fastgpuserv.2914688.1 +3 -0
  23. runs/Aug03_19-02-16_fastgpuserv/events.out.tfevents.1722693740.fastgpuserv.394929.0 +3 -0
  24. runs/Aug03_19-10-35_fastgpuserv/events.out.tfevents.1722694240.fastgpuserv.394929.1 +3 -0
  25. runs/Aug03_19-12-52_fastgpuserv/events.out.tfevents.1722694376.fastgpuserv.455047.0 +3 -0
  26. runs/Aug03_19-16-55_fastgpuserv/events.out.tfevents.1722694620.fastgpuserv.465850.0 +3 -0
  27. runs/Aug05_12-18-54_fastgpuserv/events.out.tfevents.1722842340.fastgpuserv.28637.0 +3 -0
  28. runs/Aug05_13-36-34_fastgpuserv/events.out.tfevents.1722846999.fastgpuserv.215798.0 +3 -0
  29. runs/Aug05_13-39-05_fastgpuserv/events.out.tfevents.1722847150.fastgpuserv.246775.0 +3 -0
  30. runs/Aug05_14-04-12_fastgpuserv/events.out.tfevents.1722848657.fastgpuserv.276465.0 +3 -0
  31. runs/Aug05_14-06-34_fastgpuserv/events.out.tfevents.1722848799.fastgpuserv.281870.0 +3 -0
  32. runs/Aug05_14-09-41_fastgpuserv/events.out.tfevents.1722848985.fastgpuserv.286061.0 +3 -0
  33. runs/Aug05_14-13-33_fastgpuserv/events.out.tfevents.1722849219.fastgpuserv.291050.0 +3 -0
  34. runs/Aug05_14-16-08_fastgpuserv/events.out.tfevents.1722849372.fastgpuserv.294415.0 +3 -0
  35. runs/Aug05_14-18-52_fastgpuserv/events.out.tfevents.1722849537.fastgpuserv.297893.0 +3 -0
  36. runs/Aug05_14-27-06_fastgpuserv/events.out.tfevents.1722850031.fastgpuserv.309192.0 +3 -0
  37. runs/Aug05_14-29-36_fastgpuserv/events.out.tfevents.1722850181.fastgpuserv.312411.0 +3 -0
  38. runs/Aug05_14-31-54_fastgpuserv/events.out.tfevents.1722850319.fastgpuserv.315403.0 +3 -0
  39. runs/Aug05_15-50-27_fastgpuserv/events.out.tfevents.1722855031.fastgpuserv.406263.0 +3 -0
  40. runs/Aug05_16-00-14_fastgpuserv/events.out.tfevents.1722855618.fastgpuserv.417848.0 +3 -0
  41. runs/Aug05_16-40-09_fastgpuserv/events.out.tfevents.1722858014.fastgpuserv.478008.0 +3 -0
  42. runs/Aug05_17-01-54_fastgpuserv/events.out.tfevents.1722859322.fastgpuserv.478008.1 +3 -0
  43. runs/Aug08_10-31-05_fastgpuserv/events.out.tfevents.1723095078.fastgpuserv.1098581.0 +3 -0
  44. runs/Aug08_10-45-37_fastgpuserv/events.out.tfevents.1723095944.fastgpuserv.1098581.1 +3 -0
  45. runs/Aug08_10-48-19_fastgpuserv/events.out.tfevents.1723096106.fastgpuserv.1182703.0 +3 -0
  46. runs/Aug08_11-32-43_fastgpuserv/events.out.tfevents.1723098770.fastgpuserv.1288433.0 +3 -0
  47. special_tokens_map.json +24 -0
  48. tokenizer.json +0 -0
  49. tokenizer.model +3 -0
  50. tokenizer_config.json +41 -0
README.md ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: ahxt/LiteLlama-460M-1T
3
+ library_name: peft
4
+ license: mit
5
+ tags:
6
+ - trl
7
+ - sft
8
+ - generated_from_trainer
9
+ model-index:
10
+ - name: ColdLLamaLite
11
+ results: []
12
+ ---
13
+
14
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
+ should probably proofread and complete it, then remove this comment. -->
16
+
17
+ # ColdLLamaLite
18
+
19
+ This model is a fine-tuned version of [ahxt/LiteLlama-460M-1T](https://huggingface.co/ahxt/LiteLlama-460M-1T) on an unspecified dataset.
20
+ It achieves the following results on the evaluation set:
21
+ - Loss: 2.0471
22
+
23
+ ## Model description
24
+
25
+ More information needed
26
+
27
+ ## Intended uses & limitations
28
+
29
+ More information needed
30
+
31
+ ## Training and evaluation data
32
+
33
+ More information needed
34
+
35
+ ## Training procedure
36
+
37
+ ### Training hyperparameters
38
+
39
+ The following hyperparameters were used during training:
40
+ - learning_rate: 0.0002
41
+ - train_batch_size: 32
42
+ - eval_batch_size: 32
43
+ - seed: 42
44
+ - gradient_accumulation_steps: 8
45
+ - total_train_batch_size: 256
46
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
47
+ - lr_scheduler_type: cosine
48
+ - lr_scheduler_warmup_ratio: 0.03
49
+ - num_epochs: 10
50
+
51
+ ### Training results
52
+
53
+ | Training Loss | Epoch | Step | Validation Loss |
54
+ |:-------------:|:-----:|:----:|:---------------:|
55
+ | 4.1747 | 0.8 | 25 | 3.9257 |
56
+ | 3.626 | 1.6 | 50 | 3.2474 |
57
+ | 2.8441 | 2.4 | 75 | 2.4490 |
58
+ | 2.3365 | 3.2 | 100 | 2.2482 |
59
+ | 2.2153 | 4.0 | 125 | 2.1758 |
60
+ | 2.1591 | 4.8 | 150 | 2.1316 |
61
+ | 2.1214 | 5.6 | 175 | 2.1011 |
62
+ | 2.0946 | 6.4 | 200 | 2.0781 |
63
+ | 2.0818 | 7.2 | 225 | 2.0622 |
64
+ | 2.0614 | 8.0 | 250 | 2.0528 |
65
+ | 2.0571 | 8.8 | 275 | 2.0485 |
66
+ | 2.0522 | 9.6 | 300 | 2.0471 |
67
+
68
+
69
+ ### Framework versions
70
+
71
+ - PEFT 0.12.0
72
+ - Transformers 4.43.3
73
+ - Pytorch 2.3.1+cu121
74
+ - Datasets 2.17.0
75
+ - Tokenizers 0.19.1
adapter_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "NousResearch/Llama-2-7b-hf",
5
+ "bias": "none",
6
+ "fan_in_fan_out": false,
7
+ "inference_mode": true,
8
+ "init_lora_weights": true,
9
+ "layer_replication": null,
10
+ "layers_pattern": null,
11
+ "layers_to_transform": null,
12
+ "loftq_config": {},
13
+ "lora_alpha": 16,
14
+ "lora_dropout": 0.1,
15
+ "megatron_config": null,
16
+ "megatron_core": "megatron.core",
17
+ "modules_to_save": null,
18
+ "peft_type": "LORA",
19
+ "r": 64,
20
+ "rank_pattern": {},
21
+ "revision": null,
22
+ "target_modules": [
23
+ "q_proj",
24
+ "v_proj"
25
+ ],
26
+ "task_type": "CAUSAL_LM",
27
+ "use_dora": false,
28
+ "use_rslora": false
29
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d53bd3a1801373da013ab4d28c27937c0cba54179a47ba85236eb09984317cf
3
+ size 134235048
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
runs/Aug01_10-47-52_fastgpuserv/events.out.tfevents.1722491274.fastgpuserv.2113260.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aea32443cb43711c1a8f3b9a7c6fbfc180424cf50862b663ddfcd0468dd88a28
3
+ size 5752
runs/Aug01_10-51-09_fastgpuserv/events.out.tfevents.1722491470.fastgpuserv.2113260.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89db4b1d7228307280aa3594178c3b17922ad3e04d1b2446a8e2ec2aebc66615
3
+ size 5753
runs/Aug01_10-55-04_fastgpuserv/events.out.tfevents.1722491706.fastgpuserv.2113260.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:034df33b3f1320467f8fc105405fffe445e701405a84ac31a39ad367bebcad98
3
+ size 5752
runs/Aug01_11-01-02_fastgpuserv/events.out.tfevents.1722492064.fastgpuserv.2134733.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6f63a830d193f53344febcc33dfa34ab61f00285032e3878af71b493ddde937
3
+ size 5753
runs/Aug01_11-02-42_fastgpuserv/events.out.tfevents.1722492163.fastgpuserv.2134733.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cb01cadc06f59c43c9f071f8a399a5ffb04867d74ead76ccb43c6ca702eb777
3
+ size 12697
runs/Aug01_14-05-55_fastgpuserv/events.out.tfevents.1722503158.fastgpuserv.6531.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:210ecb64a0f7832fb67fe3c9c5b4bb675f3820b2fc78ab7939d5fbbe5c6f8617
3
+ size 4184
runs/Aug01_14-08-57_fastgpuserv/events.out.tfevents.1722503340.fastgpuserv.7077.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fca9054c067e0196ed042b95af7a47122046e9703ad44707d016c515df877980
3
+ size 11399
runs/Aug02_12-33-35_fastgpuserv/events.out.tfevents.1722584019.fastgpuserv.3614347.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0c6f10b29f06bafa4219869f62edd74ac2ee0c026ba695487291d5d021d45dc
3
+ size 5788
runs/Aug02_12-40-23_fastgpuserv/events.out.tfevents.1722584427.fastgpuserv.3637409.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04572ddc12c1592d208edd2336f0e79faa38698d2d3ec790a37da0bcc55790fe
3
+ size 4184
runs/Aug02_12-42-43_fastgpuserv/events.out.tfevents.1722584567.fastgpuserv.3645427.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:942580e7674d76e0a7a957d2920080d65193d6d201bbe5cf2368600e63ea844c
3
+ size 5788
runs/Aug02_12-44-23_fastgpuserv/events.out.tfevents.1722584667.fastgpuserv.3650795.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fba86a4d41e64ccaa9035bfab269568d501df25402abc25104a4b7b802172548
3
+ size 5788
runs/Aug02_12-45-52_fastgpuserv/events.out.tfevents.1722584756.fastgpuserv.3655138.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fb7f2f39d539a2cb3a8ebc962b81040f5f9c2098322a1dc910de94df9d8247d
3
+ size 5788
runs/Aug02_13-00-24_fastgpuserv/events.out.tfevents.1722585628.fastgpuserv.3689700.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:962181f37b84fc09c9d5d465d9486947537ccde5d8879b3c9b91829ebab08902
3
+ size 5792
runs/Aug02_13-04-57_fastgpuserv/events.out.tfevents.1722585901.fastgpuserv.3707066.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f318aa9816b7523059bab4101afe1254434b1b360e65c8eb0d93983ee8ccc4d
3
+ size 4184
runs/Aug02_13-07-01_fastgpuserv/events.out.tfevents.1722586024.fastgpuserv.3714303.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:864b30d31ce12cc86b57b1490237f41dea7afc8cca93868f9902572831cdebef
3
+ size 8992
runs/Aug02_13-07-01_fastgpuserv/events.out.tfevents.1722602007.fastgpuserv.3714303.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6890949d3abe45db8d962b80fd220ed72f34e906ba435db853a4ad9a61faf49
3
+ size 359
runs/Aug03_09-18-38_fastgpuserv/events.out.tfevents.1722658721.fastgpuserv.2914688.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e33fc634c97733e26c13959db7a058b5ec76841b5b90433ea9bfaf4494eaa3e8
3
+ size 11885
runs/Aug03_09-18-38_fastgpuserv/events.out.tfevents.1722690531.fastgpuserv.2914688.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01f6462e33b14e20a451c94459665f31bb87ad7d037deac0f025e8b117299d64
3
+ size 359
runs/Aug03_19-02-16_fastgpuserv/events.out.tfevents.1722693740.fastgpuserv.394929.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e80be820f6b425d7b1ade3419aa7ebed0fa56e26199486a7971e1f9e6cc10093
3
+ size 5742
runs/Aug03_19-10-35_fastgpuserv/events.out.tfevents.1722694240.fastgpuserv.394929.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad6bdc362ad756e8824c0a05ba14a5d3c5644abbef09f806f4998245003397d4
3
+ size 4184
runs/Aug03_19-12-52_fastgpuserv/events.out.tfevents.1722694376.fastgpuserv.455047.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64749a1f1806ed0b38d9aa08dfe97cda7cc10c768c7ad251d0da1d002963a12c
3
+ size 5744
runs/Aug03_19-16-55_fastgpuserv/events.out.tfevents.1722694620.fastgpuserv.465850.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d432579479b086b6442b0e55c95ba3fd986c71afef1d06a197a802d35d6af272
3
+ size 14349
runs/Aug05_12-18-54_fastgpuserv/events.out.tfevents.1722842340.fastgpuserv.28637.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f111aca075a854c84aec9eab09bd17e7d70a72d5b4d3914245804a0d37453dc
3
+ size 5754
runs/Aug05_13-36-34_fastgpuserv/events.out.tfevents.1722846999.fastgpuserv.215798.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaf3f30f544111fcd16a032d304d98b7cc6c0600defbb43de1ff5001f5a493a2
3
+ size 4184
runs/Aug05_13-39-05_fastgpuserv/events.out.tfevents.1722847150.fastgpuserv.246775.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85df9b07446befdf5e8b91488074d17bd2ccc2782972901c87fa50a6e7cea2c9
3
+ size 5777
runs/Aug05_14-04-12_fastgpuserv/events.out.tfevents.1722848657.fastgpuserv.276465.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d112e8f7ef34e8a09c422bdf6704c2dcc5b33e2b4370e479b8c5deb6fdeeae7
3
+ size 4184
runs/Aug05_14-06-34_fastgpuserv/events.out.tfevents.1722848799.fastgpuserv.281870.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e87211b95831ba800271a1eb4d14b6e7133b58f355cc3cd1d9ea1fa23793a4b
3
+ size 5778
runs/Aug05_14-09-41_fastgpuserv/events.out.tfevents.1722848985.fastgpuserv.286061.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed4d24984935628451eb82a76ca0658c25edd73f65625252615bcc9dcfa5179d
3
+ size 5778
runs/Aug05_14-13-33_fastgpuserv/events.out.tfevents.1722849219.fastgpuserv.291050.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a18a2ffa2b324fa0fe65f9a75c99867066853739b7a30b876a278659a1c8bc79
3
+ size 5779
runs/Aug05_14-16-08_fastgpuserv/events.out.tfevents.1722849372.fastgpuserv.294415.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a3bd113966ba028f054ac0bdad2f3598a1997df638fa023334947393e342d48
3
+ size 4184
runs/Aug05_14-18-52_fastgpuserv/events.out.tfevents.1722849537.fastgpuserv.297893.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcd330d8adfb970a561d84e6a3376260e45650e373721ebf35b3d19217f51df5
3
+ size 5779
runs/Aug05_14-27-06_fastgpuserv/events.out.tfevents.1722850031.fastgpuserv.309192.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69f68c82bffddf63c61e8a491920fff6208ff1e5392fa845d01e8936768e82d3
3
+ size 5779
runs/Aug05_14-29-36_fastgpuserv/events.out.tfevents.1722850181.fastgpuserv.312411.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4487b7fc29b7be3fd9c234d57e94f4bde4a4f35d41fa6b29451249c400acad75
3
+ size 5779
runs/Aug05_14-31-54_fastgpuserv/events.out.tfevents.1722850319.fastgpuserv.315403.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:989b926716f67a5e657ce5214fcbb8dae8e8c68888b17d3b2d6b0f1148a374d2
3
+ size 6193
runs/Aug05_15-50-27_fastgpuserv/events.out.tfevents.1722855031.fastgpuserv.406263.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c5a001a3349896d328d95c512ff2c2b61b4ddf43f015cf023be78345abbdc4f
3
+ size 5779
runs/Aug05_16-00-14_fastgpuserv/events.out.tfevents.1722855618.fastgpuserv.417848.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb98cf51d681f8fba28fcb5002ad1908724a2e57a209a69583affc8888f5bd2b
3
+ size 5779
runs/Aug05_16-40-09_fastgpuserv/events.out.tfevents.1722858014.fastgpuserv.478008.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f55b368490a79a655d0062a40cfc703c7e925e7d2c8268b7d2034f201ecc5cb
3
+ size 5779
runs/Aug05_17-01-54_fastgpuserv/events.out.tfevents.1722859322.fastgpuserv.478008.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07c25d302a2f9e3cca0d7c61495d800bf6f82b1d7c87c8bae41cf04df1635e02
3
+ size 29392
runs/Aug08_10-31-05_fastgpuserv/events.out.tfevents.1723095078.fastgpuserv.1098581.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:499c61b4d2cedce67297476f77295aed93d70bad5402e8e3b3b7b66a655d6c1f
3
+ size 5776
runs/Aug08_10-45-37_fastgpuserv/events.out.tfevents.1723095944.fastgpuserv.1098581.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b0640da445457a7c7416168f1a3b4364f4f0242a496f705126ec21f635b2ba8
3
+ size 5777
runs/Aug08_10-48-19_fastgpuserv/events.out.tfevents.1723096106.fastgpuserv.1182703.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2978c6ad3b33a05b8c14f7648fcb95ed3055309cb891bd854334809e3df64cc
3
+ size 5984
runs/Aug08_11-32-43_fastgpuserv/events.out.tfevents.1723098770.fastgpuserv.1288433.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98af3c1112f57e6b132649b742b946c3b7ad4d09d3dd594d2f7369960df07692
3
+ size 7846
special_tokens_map.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "</s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "</s>",
17
+ "unk_token": {
18
+ "content": "<unk>",
19
+ "lstrip": false,
20
+ "normalized": true,
21
+ "rstrip": false,
22
+ "single_word": false
23
+ }
24
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
3
+ size 499723
tokenizer_config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": true,
3
+ "add_eos_token": false,
4
+ "add_prefix_space": null,
5
+ "added_tokens_decoder": {
6
+ "0": {
7
+ "content": "<unk>",
8
+ "lstrip": false,
9
+ "normalized": true,
10
+ "rstrip": false,
11
+ "single_word": false,
12
+ "special": true
13
+ },
14
+ "1": {
15
+ "content": "<s>",
16
+ "lstrip": false,
17
+ "normalized": true,
18
+ "rstrip": false,
19
+ "single_word": false,
20
+ "special": true
21
+ },
22
+ "2": {
23
+ "content": "</s>",
24
+ "lstrip": false,
25
+ "normalized": true,
26
+ "rstrip": false,
27
+ "single_word": false,
28
+ "special": true
29
+ }
30
+ },
31
+ "bos_token": "<s>",
32
+ "clean_up_tokenization_spaces": false,
33
+ "eos_token": "</s>",
34
+ "legacy": false,
35
+ "model_max_length": 1000000000000000019884624838656,
36
+ "pad_token": "</s>",
37
+ "sp_model_kwargs": {},
38
+ "tokenizer_class": "LlamaTokenizer",
39
+ "unk_token": "<unk>",
40
+ "use_default_system_prompt": false
41
+ }