satreysa committed on
Commit
72a7845
·
verified ·
1 Parent(s): c0c02ce

Update genai_config.json

Browse files
Files changed (1) hide show
  1. genai_config.json +54 -54
genai_config.json CHANGED
@@ -1,55 +1,55 @@
1
- {
2
- "model": {
3
- "bos_token_id": 128000,
4
- "context_length": 131072,
5
- "decoder": {
6
- "session_options": {
7
- "log_id": "onnxruntime-genai",
8
- "custom_ops_library": "<path_to>\\onnx_custom_ops.dll",
9
- "external_data_file": "DeepSeek-R1-Distill-Llama-8B.pb.bin",
10
- "custom_allocator": "shared_d3d_xrt",
11
- "hybrid_opt_free_after_prefill": "0",
12
- "hybrid_opt_gpu_jit": "0",
13
- "provider_options": []
14
- },
15
- "filename": "DeepSeek-R1-Distill-Llama-8B.onnx",
16
- "head_size": 128,
17
- "hidden_size": 4096,
18
- "inputs": {
19
- "input_ids": "input_ids",
20
- "attention_mask": "attention_mask",
21
- "position_ids": "position_ids",
22
- "past_key_names": "past_key_values.%d.key",
23
- "past_value_names": "past_key_values.%d.value"
24
- },
25
- "outputs": {
26
- "logits": "logits",
27
- "present_key_names": "present.%d.key",
28
- "present_value_names": "present.%d.value"
29
- },
30
- "num_attention_heads": 32,
31
- "num_hidden_layers": 32,
32
- "num_key_value_heads": 8
33
- },
34
- "eos_token_id": 128001,
35
- "pad_token_id": 128001,
36
- "type": "llama",
37
- "vocab_size": 128256
38
- },
39
- "search": {
40
- "diversity_penalty": 0.0,
41
- "do_sample": true,
42
- "early_stopping": true,
43
- "length_penalty": 1.0,
44
- "max_length": 131072,
45
- "min_length": 0,
46
- "no_repeat_ngram_size": 0,
47
- "num_beams": 1,
48
- "num_return_sequences": 1,
49
- "past_present_share_buffer": true,
50
- "repetition_penalty": 1.0,
51
- "temperature": 0.6,
52
- "top_k": 1,
53
- "top_p": 0.95
54
- }
55
  }
 
1
+ {
2
+ "model": {
3
+ "bos_token_id": 128000,
4
+ "context_length": 131072,
5
+ "decoder": {
6
+ "session_options": {
7
+ "log_id": "onnxruntime-genai",
8
+ "custom_ops_library": "onnx_custom_ops.dll",
9
+ "external_data_file": "DeepSeek-R1-Distill-Llama-8B.pb.bin",
10
+ "custom_allocator": "shared_d3d_xrt",
11
+ "hybrid_opt_free_after_prefill": "0",
12
+ "hybrid_opt_gpu_jit": "0",
13
+ "provider_options": []
14
+ },
15
+ "filename": "DeepSeek-R1-Distill-Llama-8B.onnx",
16
+ "head_size": 128,
17
+ "hidden_size": 4096,
18
+ "inputs": {
19
+ "input_ids": "input_ids",
20
+ "attention_mask": "attention_mask",
21
+ "position_ids": "position_ids",
22
+ "past_key_names": "past_key_values.%d.key",
23
+ "past_value_names": "past_key_values.%d.value"
24
+ },
25
+ "outputs": {
26
+ "logits": "logits",
27
+ "present_key_names": "present.%d.key",
28
+ "present_value_names": "present.%d.value"
29
+ },
30
+ "num_attention_heads": 32,
31
+ "num_hidden_layers": 32,
32
+ "num_key_value_heads": 8
33
+ },
34
+ "eos_token_id": 128001,
35
+ "pad_token_id": 128001,
36
+ "type": "llama",
37
+ "vocab_size": 128256
38
+ },
39
+ "search": {
40
+ "diversity_penalty": 0.0,
41
+ "do_sample": true,
42
+ "early_stopping": true,
43
+ "length_penalty": 1.0,
44
+ "max_length": 131072,
45
+ "min_length": 0,
46
+ "no_repeat_ngram_size": 0,
47
+ "num_beams": 1,
48
+ "num_return_sequences": 1,
49
+ "past_present_share_buffer": true,
50
+ "repetition_penalty": 1.0,
51
+ "temperature": 0.6,
52
+ "top_k": 1,
53
+ "top_p": 0.95
54
+ }
55
  }