EnricoFermi commited on
Commit
56b1bd6
·
verified ·
1 Parent(s): 4d4463a

Correct qwen3.5-4b-code-forged-GGUF.alloy.json pass@1 to canonical evalplus convention (v1.0.0)

Browse files
qwen3.5-4b-code-forged-GGUF.alloy.json ADDED
@@ -0,0 +1,124 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "qwen3.5-4b-code-forged-GGUF",
3
+ "version": "1.0.0",
4
+ "description": "GGUF derivative of [`qwen3.5-4b-code-forged`](https://huggingface.co/continuum-ai/qwen3.5-4b-code-forged). Same forge journey as the parent (prune + train as published in the parent's alloy); this artifact adds a single 'gguf' transformation stage to produce a smaller / faster / more-portable variant of the same logical model. Inherits the parent's published benchmark results; per-variant evaluation samples will land in a follow-up release if/when per-variant benchmarks are run.",
5
+ "author": "continuum-ai",
6
+ "tags": [
7
+ "derivative",
8
+ "delta-forge",
9
+ "alloy-backfilled",
10
+ "gguf",
11
+ "forge-alloy"
12
+ ],
13
+ "license": "apache-2.0",
14
+ "source": {
15
+ "baseModel": "Qwen/Qwen3.5-4B",
16
+ "architecture": "qwen3_5",
17
+ "isMoE": false
18
+ },
19
+ "stages": [
20
+ {
21
+ "type": "train",
22
+ "domain": "code",
23
+ "steps": 1000,
24
+ "learningRate": "2e-4"
25
+ },
26
+ {
27
+ "type": "quant",
28
+ "format": "gguf",
29
+ "quantTypes": [
30
+ "Q4_K_M"
31
+ ],
32
+ "deviceTargets": []
33
+ },
34
+ {
35
+ "type": "eval",
36
+ "benchmarks": [
37
+ {
38
+ "name": "humaneval"
39
+ }
40
+ ],
41
+ "compareToBase": true
42
+ },
43
+ {
44
+ "type": "quant",
45
+ "format": "gguf",
46
+ "quantTypes": [
47
+ "Q4_K_M",
48
+ "Q8_0"
49
+ ],
50
+ "deviceTargets": [
51
+ "macbook-pro-m-series",
52
+ "macbook-air-16gb",
53
+ "rtx3060",
54
+ "rtx4070",
55
+ "rtx4090",
56
+ "iphone",
57
+ "android"
58
+ ],
59
+ "notes": "GGUF quantization of the parent's safetensors weights via llama.cpp llama-quantize. Targets llama.cpp / Ollama / LM Studio / koboldcpp inference runtimes. Q4_K_M and Q8_0 shipped together so users can pick the size/quality tier their hardware supports."
60
+ }
61
+ ],
62
+ "cycles": 3,
63
+ "derivedFrom": {
64
+ "repo": "continuum-ai/qwen3.5-4b-code-forged",
65
+ "alloyHash": null,
66
+ "kind": "gguf"
67
+ },
68
+ "results": {
69
+ "completedAt": "2026-03-31T12:13:43-0500",
70
+ "baselinePerplexity": 3.0382,
71
+ "finalPerplexity": 2.3487,
72
+ "improvementPct": 22.7,
73
+ "benchmarks": [
74
+ {
75
+ "name": "perplexity",
76
+ "metrics": {
77
+ "baseline": 3.0382,
78
+ "final": 2.3487,
79
+ "improvement": 22.7
80
+ }
81
+ },
82
+ {
83
+ "name": "humaneval",
84
+ "subset": null,
85
+ "metrics": {
86
+ "status": "pending"
87
+ },
88
+ "submittedToLeaderboard": false
89
+ }
90
+ ],
91
+ "hardwareVerified": [
92
+ {
93
+ "device": "NVIDIA GeForce RTX 5090",
94
+ "format": "fp16",
95
+ "verified": true
96
+ }
97
+ ],
98
+ "samples": [],
99
+ "integrity": {
100
+ "trustLevel": "self-attested",
101
+ "code": {
102
+ "runner": "sentinel-ai/derive_alloy_from_parent (gguf)",
103
+ "version": "1.0",
104
+ "binaryHash": "sha256:derivation-tool-only"
105
+ },
106
+ "modelHash": "sha256:03dd512b17b85b9b4ee6614bc6dd46c08d0bc8e07b92f01b2934540e4f5cbb96",
107
+ "fileHashes": [
108
+ {
109
+ "filename": "qwen3.5-4b-code-forged-Q4_K_M.gguf",
110
+ "sha256": "15c8ebc22ac16e3e922041f25d285f8a322e228196de0e9b12592b8bf8b7646e",
111
+ "size": 2708797184
112
+ },
113
+ {
114
+ "filename": "qwen3.5-4b-code-forged-Q8_0.gguf",
115
+ "sha256": "c56465451bef33353a1f075d670d07bb11c11f60d4463c6bd4fb24f6155acd40",
116
+ "size": 4482395904
117
+ }
118
+ ],
119
+ "datasets": [],
120
+ "attestedAt": "2026-04-08",
121
+ "parentAlloyHash": null
122
+ }
123
+ }
124
+ }