adeelahmad committed on
Commit
c485dbd
·
verified ·
1 Parent(s): df4edb5

Upload 7 files

Browse files
config.json CHANGED
@@ -25,11 +25,11 @@
25
  "pretraining_tp": 1,
26
  "quantization": {
27
  "group_size": 64,
28
- "bits": 4
29
  },
30
  "quantization_config": {
31
  "group_size": 64,
32
- "bits": 4
33
  },
34
  "rms_norm_eps": 1e-05,
35
  "rope_scaling": {
@@ -44,5 +44,5 @@
44
  "torch_dtype": "bfloat16",
45
  "transformers_version": "4.45.0.dev0",
46
  "use_cache": true,
47
- "vocab_size": 128260
48
  }
 
25
  "pretraining_tp": 1,
26
  "quantization": {
27
  "group_size": 64,
28
+ "bits": 8
29
  },
30
  "quantization_config": {
31
  "group_size": 64,
32
+ "bits": 8
33
  },
34
  "rms_norm_eps": 1e-05,
35
  "rope_scaling": {
 
44
  "torch_dtype": "bfloat16",
45
  "transformers_version": "4.45.0.dev0",
46
  "use_cache": true,
47
+ "vocab_size": 128268
48
  }
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35e609513cf73518e0c62f3fd8d6f48a8b37d16b53c0d0716cc3debfab2f2365
3
- size 5368503297
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:005cb9b304b330795eb9b931fb14bd2ce907e5b87b5515caa076e83facf80246
3
+ size 5368552449
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f176279ad187d542bdc3ddd63d7d47e217a2aae4b980b10be822ab19f3543fae
3
  size 1057050053
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aaf0a6076db00ce1cfd609cebfcc393732504db490884a241a6578cec7439ae
3
  size 1057050053
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 6425524224
4
  },
5
  "weight_map": {
6
  "model.embed_tokens.weight": "model-00001-of-00002.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 6425573376
4
  },
5
  "weight_map": {
6
  "model.embed_tokens.weight": "model-00001-of-00002.safetensors",
special_tokens_map.json CHANGED
@@ -1,9 +1,17 @@
1
  {
2
  "additional_special_tokens": [
3
- "<thinking>",
 
 
 
4
  "</thinking>",
 
5
  "<answer>",
6
- "</answer>"
 
 
 
 
7
  ],
8
  "bos_token": {
9
  "content": "<|begin_of_text|>",
@@ -13,7 +21,14 @@
13
  "single_word": false
14
  },
15
  "eos_token": {
16
- "content": "<|eot_id|>",
 
 
 
 
 
 
 
17
  "lstrip": false,
18
  "normalized": false,
19
  "rstrip": false,
 
1
  {
2
  "additional_special_tokens": [
3
+ "</answer>",
4
+ "</img_base64>",
5
+ "</json_output>",
6
+ "</ocr_text>",
7
  "</thinking>",
8
+ "</tool_code>",
9
  "<answer>",
10
+ "<img_base64>",
11
+ "<json_output>",
12
+ "<ocr_text>",
13
+ "<thinking>",
14
+ "<tool_code>"
15
  ],
16
  "bos_token": {
17
  "content": "<|begin_of_text|>",
 
21
  "single_word": false
22
  },
23
  "eos_token": {
24
+ "content": "<|end_of_text|>",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<|end_of_text|>",
32
  "lstrip": false,
33
  "normalized": false,
34
  "rstrip": false,
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:659b86188dc6339d60c3aebaa90c48dbda63bde0cde4705e6da67bf448acdf9d
3
- size 17210666
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5760aba0c96242f8b528c7e344760e333db5d6d73df8e88b7fdb0ba0ff13fbfa
3
+ size 17212178
tokenizer_config.json CHANGED
@@ -2079,23 +2079,96 @@
2079
  "rstrip": false,
2080
  "single_word": false,
2081
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2082
  }
2083
  },
2084
  "additional_special_tokens": [
2085
- "<thinking>",
 
 
 
2086
  "</thinking>",
 
2087
  "<answer>",
2088
- "</answer>"
 
 
 
 
2089
  ],
2090
  "bos_token": "<|begin_of_text|>",
2091
  "chat_template": "{{- bos_token }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- if strftime_now is defined %}\n {%- set date_string = strftime_now(\"%d %b %Y\") %}\n {%- else %}\n {%- set date_string = \"26 Jul 2024\" %}\n {%- endif %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n{%- else %}\n {%- set system_message = \"\" %}\n{%- endif %}\n\n{#- System message #}\n{{- \"<|start_header_id|>system<|end_header_id|>\\n\\n\" }}\n{%- if tools is not none %}\n {{- \"Environment: ipython\\n\" }}\n{%- endif %}\n{{- \"Cutting Knowledge Date: December 2023\\n\" }}\n{{- \"Today Date: \" + date_string + \"\\n\\n\" }}\n{%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n{%- endif %}\n{{- system_message }}\n{{- \"<|eot_id|>\" }}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|start_header_id|>user<|end_header_id|>\\n\\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\\n\\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot_id|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n'+ message['content'] | trim + '<|eot_id|>' }}\n {%- elif 'tool_calls' in message %}\n {%- if not message.tool_calls|length == 1 %}\n {{- raise_exception(\"This model only supports single tool-calls at once!\") }}\n {%- endif %}\n {%- set tool_call = message.tool_calls[0].function %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' -}}\n {{- '{\"name\": \"' + tool_call.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- \"}\" }}\n {{- \"<|eot_id|>\" }}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|start_header_id|>ipython<|end_header_id|>\\n\\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' }}\n{%- endif %}\n",
2092
  "clean_up_tokenization_spaces": true,
2093
- "eos_token": "<|eot_id|>",
2094
  "extra_special_tokens": {},
2095
  "model_input_names": [
2096
  "input_ids",
2097
  "attention_mask"
2098
  ],
2099
  "model_max_length": 131072,
 
2100
  "tokenizer_class": "PreTrainedTokenizer"
2101
  }
 
2079
  "rstrip": false,
2080
  "single_word": false,
2081
  "special": true
2082
+ },
2083
+ "128260": {
2084
+ "content": "</img_base64>",
2085
+ "lstrip": false,
2086
+ "normalized": false,
2087
+ "rstrip": false,
2088
+ "single_word": false,
2089
+ "special": true
2090
+ },
2091
+ "128261": {
2092
+ "content": "</json_output>",
2093
+ "lstrip": false,
2094
+ "normalized": false,
2095
+ "rstrip": false,
2096
+ "single_word": false,
2097
+ "special": true
2098
+ },
2099
+ "128262": {
2100
+ "content": "</ocr_text>",
2101
+ "lstrip": false,
2102
+ "normalized": false,
2103
+ "rstrip": false,
2104
+ "single_word": false,
2105
+ "special": true
2106
+ },
2107
+ "128263": {
2108
+ "content": "</tool_code>",
2109
+ "lstrip": false,
2110
+ "normalized": false,
2111
+ "rstrip": false,
2112
+ "single_word": false,
2113
+ "special": true
2114
+ },
2115
+ "128264": {
2116
+ "content": "<img_base64>",
2117
+ "lstrip": false,
2118
+ "normalized": false,
2119
+ "rstrip": false,
2120
+ "single_word": false,
2121
+ "special": true
2122
+ },
2123
+ "128265": {
2124
+ "content": "<json_output>",
2125
+ "lstrip": false,
2126
+ "normalized": false,
2127
+ "rstrip": false,
2128
+ "single_word": false,
2129
+ "special": true
2130
+ },
2131
+ "128266": {
2132
+ "content": "<ocr_text>",
2133
+ "lstrip": false,
2134
+ "normalized": false,
2135
+ "rstrip": false,
2136
+ "single_word": false,
2137
+ "special": true
2138
+ },
2139
+ "128267": {
2140
+ "content": "<tool_code>",
2141
+ "lstrip": false,
2142
+ "normalized": false,
2143
+ "rstrip": false,
2144
+ "single_word": false,
2145
+ "special": true
2146
  }
2147
  },
2148
  "additional_special_tokens": [
2149
+ "</answer>",
2150
+ "</img_base64>",
2151
+ "</json_output>",
2152
+ "</ocr_text>",
2153
  "</thinking>",
2154
+ "</tool_code>",
2155
  "<answer>",
2156
+ "<img_base64>",
2157
+ "<json_output>",
2158
+ "<ocr_text>",
2159
+ "<thinking>",
2160
+ "<tool_code>"
2161
  ],
2162
  "bos_token": "<|begin_of_text|>",
2163
  "chat_template": "{{- bos_token }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- if strftime_now is defined %}\n {%- set date_string = strftime_now(\"%d %b %Y\") %}\n {%- else %}\n {%- set date_string = \"26 Jul 2024\" %}\n {%- endif %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n{%- else %}\n {%- set system_message = \"\" %}\n{%- endif %}\n\n{#- System message #}\n{{- \"<|start_header_id|>system<|end_header_id|>\\n\\n\" }}\n{%- if tools is not none %}\n {{- \"Environment: ipython\\n\" }}\n{%- endif %}\n{{- \"Cutting Knowledge Date: December 2023\\n\" }}\n{{- \"Today Date: \" + date_string + \"\\n\\n\" }}\n{%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n{%- endif %}\n{{- system_message }}\n{{- \"<|eot_id|>\" }}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|start_header_id|>user<|end_header_id|>\\n\\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\\n\\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot_id|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n'+ message['content'] | trim + '<|eot_id|>' }}\n {%- elif 'tool_calls' in message %}\n {%- if not message.tool_calls|length == 1 %}\n {{- raise_exception(\"This model only supports single tool-calls at once!\") }}\n {%- endif %}\n {%- set tool_call = message.tool_calls[0].function %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' -}}\n {{- '{\"name\": \"' + tool_call.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- \"}\" }}\n {{- \"<|eot_id|>\" }}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|start_header_id|>ipython<|end_header_id|>\\n\\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' }}\n{%- endif %}\n",
2164
  "clean_up_tokenization_spaces": true,
2165
+ "eos_token": "<|end_of_text|>",
2166
  "extra_special_tokens": {},
2167
  "model_input_names": [
2168
  "input_ids",
2169
  "attention_mask"
2170
  ],
2171
  "model_max_length": 131072,
2172
+ "pad_token": "<|end_of_text|>",
2173
  "tokenizer_class": "PreTrainedTokenizer"
2174
  }