My `models.ini` for llama.cpp:

; Preset for the Q8_0 "AGENT" GGUF. This section passes
; preserve_thinking=true to the chat template and sets no reasoning-* keys.
[Jackrong-Qwopus3.6-35B-A3B-Coder-Q8_0_ROCMFPX]
; Model weights, multimodal projector and chat template all live in the same directory.
model = /mnt/models/Jackrong-Qwopus3.6-35B-A3B-Coder-ROCMFPX/Jackrong-Qwopus3.6-35B-A3B-Coder-Q8_0_ROCMFPX_AGENT.gguf
mmproj = /mnt/models/Jackrong-Qwopus3.6-35B-A3B-Coder-ROCMFPX/mmproj-F32.gguf
chat-template-file = /mnt/models/Jackrong-Qwopus3.6-35B-A3B-Coder-ROCMFPX/chat_template.jinja
; Lower-case name for this preset.
alias = jackrong-qwopus3.6-35b-a3b-coder-q8-rocmfpx
; 262144 = 256 * 1024 tokens.
ctx-size = 262144
; Sampling settings.
; NOTE(review): min-p 0.0, presence-penalty 0.0 and repeat-penalty 1.0 look like
; "disabled" values -- confirm against the sampler documentation.
temp = 0.6
top-p = 0.95
top-k = 20
min-p = 0.0
presence-penalty = 0.0
repeat-penalty = 1.0
; Main model and draft are both placed on the same device (Vulkan0).
device = Vulkan0
; NOTE(review): the spec-* keys presumably configure speculative decoding with an
; MTP draft -- confirm that the llama.cpp build in use accepts every one of them.
spec-type = draft-mtp
spec-draft-device = Vulkan0
spec-draft-n-max = 2
spec-draft-ngl = all
; The draft cache types are f16, while the main cache-type-k/v below are q8_0.
spec-draft-type-k = f16
spec-draft-type-v = f16
; The next three keys are written as key=value without spaces, unlike the rest of the section.
spec-draft-n-min=0
spec-draft-p-min=0.0
spec-draft-p-split=0.10
; NOTE(review): np presumably is the number of parallel slots -- confirm.
np = 1
; JSON object handed to the chat template; the value must stay valid JSON.
chat-template-kwargs = {"preserve_thinking": true}
; Cache types for K and V on the main model.
cache-type-k = q8_0
cache-type-v = q8_0

; "-it" preset: points at the same model, mmproj and chat-template files as the
; section without the "-it" suffix, but adds reasoning = off, reasoning-format,
; reasoning-budget and no-context-shift, and sets no chat-template-kwargs.
[Jackrong-Qwopus3.6-35B-A3B-Coder-Q8_0_ROCMFPX-it]
; Model weights, multimodal projector and chat template all live in the same directory.
model = /mnt/models/Jackrong-Qwopus3.6-35B-A3B-Coder-ROCMFPX/Jackrong-Qwopus3.6-35B-A3B-Coder-Q8_0_ROCMFPX_AGENT.gguf
mmproj = /mnt/models/Jackrong-Qwopus3.6-35B-A3B-Coder-ROCMFPX/mmproj-F32.gguf
chat-template-file = /mnt/models/Jackrong-Qwopus3.6-35B-A3B-Coder-ROCMFPX/chat_template.jinja
; Lower-case name for this preset; the "-it" suffix distinguishes it from the other section's alias.
alias = jackrong-qwopus3.6-35b-a3b-coder-q8-rocmfpx-it
; 262144 = 256 * 1024 tokens.
ctx-size = 262144
; Sampling settings (same values as the non-"-it" section).
temp = 0.6
top-p = 0.95
top-k = 20
min-p = 0.0
presence-penalty = 0.0
repeat-penalty = 1.0
; Reasoning is switched off for this preset.
; NOTE(review): reasoning-budget = -1 presumably means "unrestricted", which may be
; redundant while reasoning = off -- confirm against the server documentation.
reasoning = off
reasoning-format = none
reasoning-budget = -1
; NOTE(review): presumably disables context shifting when the context fills up -- confirm.
no-context-shift = true
; Main model and draft are both placed on the same device (Vulkan0).
device = Vulkan0
; NOTE(review): the spec-* keys presumably configure speculative decoding with an
; MTP draft -- confirm that the llama.cpp build in use accepts every one of them.
spec-type = draft-mtp
spec-draft-device = Vulkan0
spec-draft-n-max = 2
spec-draft-ngl = all
; The draft cache types are f16, while the main cache-type-k/v below are q8_0.
spec-draft-type-k = f16
spec-draft-type-v = f16
; The next three keys are written as key=value without spaces, unlike the rest of the section.
spec-draft-n-min=0
spec-draft-p-min=0.0
spec-draft-p-split=0.10
; NOTE(review): np presumably is the number of parallel slots -- confirm.
np = 1
; Cache types for K and V on the main model.
cache-type-k = q8_0
cache-type-v = q8_0
Downloads last month
6,279
GGUF
Model size
36B params
Architecture
qwen35moe
Hardware compatibility
Log In to add your hardware

4-bit

8-bit

Inference Providers NEW
This model isn't deployed by any Inference Provider. 🙋 Ask for provider support

Model tree for rcmorano/Jackrong-Qwopus3.6-35B-A3B-Coder-ROCMFPX