vladislavbro committed on
Commit
ea5b596
·
verified ·
1 Parent(s): 217adb5

Upload 3 files

Browse files
Files changed (4) hide show
  1. .gitattributes +1 -0
  2. genai_config.json +8 -3
  3. llama3.data +3 -0
  4. llama3.onnx +2 -2
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  llama3.onnx.data filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  llama3.onnx.data filter=lfs diff=lfs merge=lfs -text
37
+ llama3.data filter=lfs diff=lfs merge=lfs -text
genai_config.json CHANGED
@@ -5,14 +5,19 @@
5
  "decoder": {
6
  "session_options": {
7
  "log_id": "onnxruntime-genai",
8
- "provider_options": []
 
 
 
 
9
  },
10
  "filename": "model.onnx",
11
  "head_size": 64,
12
  "hidden_size": 1024,
13
  "inputs": {
14
- "input_ids": "input_ids",
15
  "attention_mask": "attention_mask",
 
16
  "past_key_names": "past_key_values.%d.key",
17
  "past_value_names": "past_key_values.%d.value"
18
  },
@@ -28,7 +33,7 @@
28
  "eos_token_id": 2,
29
  "pad_token_id": 2,
30
  "type": "llama",
31
- "vocab_size": 8
32
  },
33
  "search": {
34
  "diversity_penalty": 0.0,
 
5
  "decoder": {
6
  "session_options": {
7
  "log_id": "onnxruntime-genai",
8
+ "provider_options": [
9
+ {
10
+ "webgpu": {}
11
+ }
12
+ ]
13
  },
14
  "filename": "model.onnx",
15
  "head_size": 64,
16
  "hidden_size": 1024,
17
  "inputs": {
18
+ "inputs_embeds": "inputs_embeds",
19
  "attention_mask": "attention_mask",
20
+ "position_ids": "position_ids",
21
  "past_key_names": "past_key_values.%d.key",
22
  "past_value_names": "past_key_values.%d.value"
23
  },
 
33
  "eos_token_id": 2,
34
  "pad_token_id": 2,
35
  "type": "llama",
36
+ "vocab_size": 8194
37
  },
38
  "search": {
39
  "diversity_penalty": 0.0,
llama3.data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65a763b2501b0022b6405ddbd3fd1a0ee36c4b58731199e035d55efdb3424bad
3
+ size 2080645120
llama3.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ec159c6eb08380e73772c6c303271bf8d9bc8778d0dbee7e7f14a7e391bc420
3
- size 169240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a9cc8435d74a378709fb44057d1d8a4bfba1d6ce334668d5fd8cfb8e0a14684
3
+ size 222296