satreysa committed on
Commit
575bdf3
·
verified ·
1 Parent(s): 484773e

Upload 8 files

Browse files
Files changed (2) hide show
  1. Olmo-1B-SFT_jit.onnx +2 -2
  2. genai_config.json +25 -25
Olmo-1B-SFT_jit.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e5c44b486eba950436bb184ad6a6c45eeecb5d2291d8630f93bebc0d1bd9785d
3
- size 143991
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72965fae6672c8ceb83533af36d4b3aa78437fb0a1c1f12ff603878e44354366
3
+ size 143951
genai_config.json CHANGED
@@ -5,35 +5,35 @@
5
  "decoder": {
6
  "session_options": {
7
  "log_id": "onnxruntime-genai",
8
- "custom_ops_library": "C:\\Users\\satreysa\\Downloads\\Python run\\hybrid-llm-artifacts_1.3.0\\hybrid-llm-artifacts\\onnx_utils\\bin\\onnx_custom_ops.dll",
9
  "custom_allocator": "shared_d3d_xrt",
10
- "external_data_file": "Olmo-1B-SFT_jit.pb.bin",
11
  "provider_options": [
12
  ]
13
  },
14
- "filename": "Olmo-1B-SFT_jit.onnx",
15
- "head_size": 128,
16
- "hidden_size": 2048,
17
- "inputs": {
18
- "input_ids": "input_ids",
19
- "attention_mask": "attention_mask",
20
- "position_ids": "position_ids",
21
- "past_key_names": "past_key_values.%d.key",
22
- "past_value_names": "past_key_values.%d.value"
23
- },
24
- "outputs": {
25
- "logits": "logits",
26
- "present_key_names": "present.%d.key",
27
- "present_value_names": "present.%d.value"
28
- },
29
- "num_attention_heads": 16,
30
- "num_hidden_layers": 16,
31
- "num_key_value_heads": 16
32
- },
33
- "eos_token_id": 0,
34
- "pad_token_id": 1,
35
- "type": "olmo",
36
- "vocab_size": 50304
37
  },
38
  "search": {
39
  "diversity_penalty": 0.0,
 
5
  "decoder": {
6
  "session_options": {
7
  "log_id": "onnxruntime-genai",
8
+ "custom_ops_library": "onnx_custom_ops.dll",
9
  "custom_allocator": "shared_d3d_xrt",
10
+ "external_data_file": "Phi-3-mini-4k_jit.pb.bin",
11
  "provider_options": [
12
  ]
13
  },
14
+ "filename": "Phi-3-mini-4k_jit.onnx",
15
+ "head_size": 128,
16
+ "hidden_size": 2048,
17
+ "inputs": {
18
+ "input_ids": "input_ids",
19
+ "attention_mask": "attention_mask",
20
+ "position_ids": "position_ids",
21
+ "past_key_names": "past_key_values.%d.key",
22
+ "past_value_names": "past_key_values.%d.value"
23
+ },
24
+ "outputs": {
25
+ "logits": "logits",
26
+ "present_key_names": "present.%d.key",
27
+ "present_value_names": "present.%d.value"
28
+ },
29
+ "num_attention_heads": 16,
30
+ "num_hidden_layers": 16,
31
+ "num_key_value_heads": 16
32
+ },
33
+ "eos_token_id": 0,
34
+ "pad_token_id": 1,
35
+ "type": "olmo",
36
+ "vocab_size": 50304
37
  },
38
  "search": {
39
  "diversity_penalty": 0.0,