{
  "dialog": {
    "version": 1,
    "type": "basic",
    "context": {
      "version": 1,
      "size": 4096,
      "n-vocab": 128256,
      "bos-token": -1,
      "eos-token": [
        128001,
        128009,
        128008
      ]
    },
    "sampler": {
      "version": 1,
      "seed": 42,
      "temp": 0.8,
      "top-k": 40,
      "top-p": 0.95
    },
    "tokenizer": {
      "version": 1,
      "path": "tokenizer.json"
    },
    "engine": {
      "version": 1,
      "n-threads": 3,
      "backend": {
        "version": 1,
        "type": "QnnHtp",
        "QnnHtp": {
          "version": 1,
          "use-mmap": false,
          "spill-fill-bufsize": 0,
          "mmap-budget": 0,
          "poll": true,
          "cpu-mask": "0xe0",
          "kv-dim": 128,
          "allow-async-init": false
        },
        "extensions": "htp_backend_ext_config.json"
      },
      "model": {
        "version": 1,
        "type": "binary",
        "binary": {
          "version": 1,
          "ctx-bins": [
            "llama_v3_2_3b_chat_quantized_part_1_of_3.bin",
            "llama_v3_2_3b_chat_quantized_part_2_of_3.bin",
            "llama_v3_2_3b_chat_quantized_part_3_of_3.bin"
          ]
        },
        "positional-encoding": {
          "type": "rope",
          "rope-dim": 64,
          "rope-theta": 500000,
          "rope-scaling": {
            "rope-type": "llama3",
            "factor": 8.0,
            "low-freq-factor": 1.0,
            "high-freq-factor": 4.0,
            "original-max-position-embeddings": 8192
          }
        }
      }
    }
  }
}