cmh commited on
Commit
d9704bf
·
verified ·
1 Parent(s): ed29b6c

Upload 8 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ size_kld_plot_Qwen3.6-35B-A3B.png filter=lfs diff=lfs merge=lfs -text
37
+ size_ppl_plot_Qwen3.6-35B-A3B.png filter=lfs diff=lfs merge=lfs -text
3d_Qwen3.6-35B-A3B.html ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ <html>
2
+ <head><meta charset="utf-8" /></head>
3
+ <body>
4
+ <div> <script>window.PlotlyConfig = {MathJaxConfig: 'local'};</script>
5
+ <script charset="utf-8" src="https://cdn.plot.ly/plotly-3.5.0.min.js" integrity="sha256-fHbNLP+GlIXN+efbQec78UkemUz3NJp7UmfGxC1tNxs=" crossorigin="anonymous"></script> <div id="43b7d76c-8672-4e46-bcd0-71849007cb6f" class="plotly-graph-div" style="height:900px; width:1200px;"></div> <script> window.PLOTLYENV=window.PLOTLYENV || {}; if (document.getElementById("43b7d76c-8672-4e46-bcd0-71849007cb6f")) { Plotly.newPlot( "43b7d76c-8672-4e46-bcd0-71849007cb6f", [{"customdata":[["mradermacher_i1-IQ4_XS"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"mradermacher","marker":{"color":"#4477AA","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"mradermacher","showlegend":true,"text":["i1-IQ4_XS"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"xSCwcmhxMUA="},"y":{"dtype":"f8","bdata":"HcwmwLD8oT8="},"z":{"dtype":"f8","bdata":"+GuyRj20HUA="},"type":"scatter3d"},{"customdata":[["sphaela_Q8_0"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"sphaela","marker":{"color":"#228833","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"sphaela","showlegend":true,"text":["Q8_0"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"rBxaZDsvQUA="},"y":{"dtype":"f8","bdata":"tcU1PpP9gz8="},"z":{"dtype":"f8","bdata":"JEbPLXRlHUA="},"type":"scatter3d"},{"customdata":[["0xSero_Q8_0"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"0xSero","marker":{"color":"#CCBB44","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"0xSero","showlegend":true,"text":["Q8_0"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"rBxaZDsvQUA="},"y":{"dtype":"f8","bdata":"Q+T09XzNgj8="},"z":{"dtype":"f8","bdata":"eXWOAdlrHUA="},"type":"scatter3d"},{"customdata":[["MXFP4_MOE"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"MXFP4","marker":{"color":"#AA3377","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"MXFP4","showlegend":true,"text":["MOE"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"AAAAAADgMkA="},"y":{"dtype":"f8","bdata":"V89J7xtfoz8="},"z":{"dtype":"f8","bdata":"jrJ+MzF9HUA="},"type":"scatter3d"},{"customdata":[["AesSedai_IQ4_XS"],["AesSedai_Q4_K_M"],["AesSedai_Q5_K_M"],["AesSedai_Q6_K"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"AesSedai","marker":{"color":"#4477AA","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"AesSedai","showlegend":true,"text":["IQ4_XS","Q4_K_M","Q5_K_M","Q6_K"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"SOF6FK5nMEA5tMh2vp80QMHKoUW2czhAz\u002fdT46UbO0A="},"y":{"dtype":"f8","bdata":"jNmSVRFuoj8\u002fqfbpeMyQP77bvHFSmIc\u002fMNgN2xZlhj8="},"z":{"dtype":"f8","bdata":"uaXVkLhHHkBC0qdV9HcdQPsGJjeKbB1A3V1nQ\u002f55HUA="},"type":"scatter3d"},{"customdata":[["bartowski_IQ4_XS"],["bartowski_IQ4_NL"],["bartowski_Q4_0"],["bartowski_Q4_K_S"],["bartowski_Q4_K_L"],["bartowski_Q5_K_S"],["bartowski_Q8_0"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"bartowski","marker":{"color":"#EE6677","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"bartowski","showlegend":true,"text":["IQ4_XS","IQ4_NL","Q4_0","Q4_K_S","Q4_K_L","Q5_K_S","Q8_0"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"pHA9CteDMUCsHFpkO38yQKabxCCwkjJAIbByaJEtM0CgGi\u002fdJEY0QKwcWmQ7fzZAjZduEoMwQUA="},"y":{"dtype":"f8","bdata":"UhA8vr1roD95d2SsNv+fPxjQC3cujKQ\u002fQni0ccRanD\u002fy0He3skSXP2WNeohGd5A\u002fR+NQvwtbgz8="},"z":{"dtype":"f8","bdata":"mmA41zCjHUBSKXY0DqUdQAk02NR5hB1AZTcz+tHgHUCil1Est5QdQMPTK2UZgh1ADypxHeNqHUA="},"type":"scatter3d"},{"customdata":[["unsloth_UD-IQ4_NL_XL"],["unsloth_UD-Q4_K_S"],["unsloth_MXFP4_MOE"],["unsloth_UD-Q4_K_M"],["unsloth_UD-Q5_K_S"],["unsloth_UD-Q5_K_M"],["unsloth_UD-Q6_K"],["unsloth_UD-Q6_K_XL"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"unsloth","marker":{"color":"#228833","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"unsloth","showlegend":true,"text":["UD-IQ4_NL_XL","UD-Q4_K_S","MXFP4_MOE","UD-Q4_K_M","UD-Q5_K_S","UD-Q5_K_M","UD-Q6_K","UD-Q6_K_XL"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"8KfGSzcpMkBoke18P3UzQNejcD0KNzRAd76fGi+dNEC0yHa+nzo3QN0kBoGVozhAsp3vp8ZLO0DVeOkmMag9QA=="},"y":{"dtype":"f8","bdata":"Yk7QJodPmj+5xJEHIouUPyBe1y\u002fYDZs\u002f66hqgqj7kD8PgSOBBpuKP2VvKeeLvYc\u002fLIApAwe0hD\u002fThy6ob5mDPw=="},"z":{"dtype":"f8","bdata":"Y2LzcW3oHUAixQCJJrAdQGa7Qh8sYx1AzOzzGOWZHUDTTPc6qV8dQJBMh07PWx1AcodNZOZyHUBETfT5KIMdQA=="},"type":"scatter3d"},{"customdata":[["mudler_APEX-I-Mini"],["mudler_APEX-I-Compact"],["mudler_APEX-I-Quality"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"mudler","marker":{"color":"#66CCEE","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"mudler","showlegend":true,"text":["APEX-I-Mini","APEX-I-Compact","APEX-I-Quality"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"0SLb+X6qKkB7FK5H4RowQI2XbhKDQDVA"},"y":{"dtype":"f8","bdata":"qaPjamRXtj9sIjMXuDymP+MZNPRPcJE\u002f"},"z":{"dtype":"f8","bdata":"Ek2giEUcH0DVQPM5d+sdQKpkAKjiVh1A"},"type":"scatter3d"},{"customdata":[["Thireus_6.0569bpw"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: Pareto-optimal\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"Thireus","marker":{"color":"#AA3377","line":{"color":"white","width":0.5},"opacity":1.0,"size":10},"mode":"markers+text","name":"Thireus","showlegend":true,"text":["6.0569bpw"],"textfont":{"color":"white","size":9},"textposition":"top center","x":{"dtype":"f8","bdata":"MzMzMzNzOEA="},"y":{"dtype":"f8","bdata":"mIi3zr9dhj8="},"z":{"dtype":"f8","bdata":"o3kAi\u002fx6HUA="},"type":"scatter3d"},{"customdata":[["mradermacher_i1-Q4_0"],["mradermacher_i1-Q4_K_S"],["mradermacher_i1-Q4_K_M"],["mradermacher_i1-Q4_1"],["mradermacher_i1-Q5_K_S"],["mradermacher_i1-Q5_K_M"],["mradermacher_i1-Q6_K"],["batiai_IQ4_XS"],["batiai_Q4_K_M"],["batiai_Q5_K_M"],["batiai_Q6_K"],["batiai_Q8_0"],["sphaela_Q4_0"],["sphaela_Q4_K_M"],["sphaela_Q4_K_S"],["0xSero_Q4_0"],["worthdoing_Q4_K_S"],["0xSero_IQ4_NL"],["0xSero_DYNAMIC"],["0xSero_Q4_K_M"],["worthdoing_Q4_K_M"],["steampunque_Q4_K_H"],["sphaela_Q4_1"],["sphaela_Q5_0"],["sphaela_Q5_K_M"],["sphaela_Q5_K_S"],["worthdoing_Q5_K_S"],["0xSero_Q5_K_M"],["worthdoing_Q5_K_M"],["sphaela_Q5_1"],["0xSero_Q6_K"],["worthdoing_Q8_0"],["bartowski_Q4_K_M"],["bartowski_Q4_1"],["bartowski_Q5_K_M"],["bartowski_Q5_K_L"],["bartowski_Q6_K"],["bartowski_Q6_K_L"],["unsloth_UD-IQ4_XS"],["unsloth_UD-IQ4_NL"],["unsloth_UD-Q4_K_XL"],["unsloth_UD-Q5_K_XL"],["unsloth_Q8_0"],["unsloth_UD-Q8_K_XL"],["lmstudio_Q4_K_M"],["lmstudio_Q6_K"],["lmstudio_Q8_0"],["mudler_APEX-Compact"],["mudler_APEX-Quality"],["mudler_APEX-Balanced"],["mudler_APEX-I-Balanced"],["Thireus_4.0579bpw"],["Thireus_4.5077bpw"],["Thireus_4.8273bpw"],["Thireus_5.1174bpw"],["Thireus_5.5079bpw"],["Thireus_5.7548bpw"],["Thireus_6.7626bpw"]],"hovertemplate":"\u003cb\u003e%{customdata[0]}\u003c\u002fb\u003e\u003cbr\u003eStatus: dominated\u003cbr\u003e\u003cextra\u003e\u003c\u002fextra\u003e","legendgroup":"dominated","marker":{"color":"#888888","opacity":0.15,"size":10},"mode":"markers","name":"(dominated)","showlegend":true,"x":{"dtype":"f8","bdata":"cT0K16NwMkCgGi\u002fdJIYyQEoMAiuHtjNADAIrhxZZNEAv3SQGgVU2QA4tsp3vBzdAdZMYBFaOOkDFILByaHExQEoMAiuHtjNADi2yne8HN0B1kxgEVo46QKwcWmQ7L0FAI9v5fmpcMkAj2\u002fl+alwyQCPb+X5qXDJAI9v5fmpcMkCgGi\u002fdJIYyQIcW2c73kzJAMzMzMzMTM0BKDAIrh7YzQEoMAiuHtjNAzczMzMzsM0AMAiuHFlk0QC\u002fdJAaBVTZAL90kBoFVNkAv3SQGgVU2QC\u002fdJAaBVTZADi2yne8HN0AOLbKd7wc3QBkEVg4tUjhAdZMYBFaOOkCsHFpkOy9BQHnpJjEI7DNA16NwPQp3NEAGgZVDi0w3QGQ730+NlzdAd76fGi\u002f9O0Dy0k1iEDg8QBfZzvdTgzBAWmQ730\u002fNMEAzMzMzM9M0QGq8dJMYxDhArBxaZDsvQUBI4XoUrudBQEoMAiuHtjNAdZMYBFaOOkCsHFpkOy9BQHsUrkfhGjBAjZduEoNANUA9CtejcN03QD0K16Nw3TdA\u002fKnx0k1iMEBQjZduEkMyQJMYBFYOjTNAYhBYObSoNEBcj8L1KDw2QEJg5dAiOzdAPzVeuklMO0A="},"y":{"dtype":"f8","bdata":"FZFhFW9krj9UcHhBRGqiP+YeEr73N6A\u002fsHYU56ijoz\u002fMtz6sN2qVPyxjQzf7A5U\u002fKZZbWg2Jiz\u002fvdVJflnaiP28qUmFsIaA\u002fl+SAXU2ekj86kst\u002fSL+NP135LM+Du4M\u002fRu9UwD3Prz+tS43Qz9SjP61LjdDP1KM\u002f9x3DYz+LsT+rsBnggmyxP2bdPxaiQ6g\u002fWp2cobjjpT88FAX6RJ6sP+qWHeIftqw\u002fbcmqCDcZpT+eQxmqYiq1PydnKO54k58\u002fB3qobcMosD8HeqhtwyiwP7MHWoEhq5s\u002f\u002fWmjOh3Imj9n7bYLzXWaP95VD5iHTKE\u002fUg5mE2BYjj8yAFRx4xaDPzdV98jmqpk\u002foWgewCK\u002fnj+srdhfdk+OPzv\u002fdtmvO40\u002frws\u002fOJ86hj\u002f600Z1OpCFP1JF8Sprm6I\u002ft5c0Ruuooj\u002fToj7JHTaRPzQw8rImFog\u002fya8fYoOFgz9YjSWsjbGDPzwUBfpEnqw\u002fogip29lXjj\u002fy6bEtA86CP16AfXTqyq8\u002fby2T4Xg+kz+VLCeh9IWQP+NRKuEJvY4\u002fVDiCVIodsT+Ug9kEGJanP+yIQzaQLqY\u002fJ09ZTdcTpT\u002fGv8+4cCCkP8yYgjXOpqM\u002ft7dbkgN2hT8="},"z":{"dtype":"f8","bdata":"on+CixXlHUD19BH4w\u002f8dQOfEHtrH2h1A8UV7vJAeHkCgpwGDpG8dQGmtaHOcax1AQGt+\u002fKV1HUBTPZl\u002f9M0dQOYg6GhV2x1ADhDM0eOHHUCdLSC0Ho4dQCLCvwgacx1AEce6uI3WHUAt6L0xBBAeQC3ovTEEEB5A1GGFWz7yHUDcDg2LUScfQPktOllqzR1AaHqJsUzvHUDX+bfLfp0eQL+36c9+pB5Aa0qyDkcnHkAaogp\u002fhhceQPt46Ltb6R1A8Q7wpIULH0DxDvCkhQsfQPmCFhIwuh1A4gM7\u002fgu0HUAOvcXDe64dQGhaYmU0ch1AfbH34ouWHUAVb2Qe+XMdQNRFCmXhux1AMdEgBU\u002fBHUAsms5OBocdQPfJUYAoaB1A4A8\u002f\u002fz2IHUDCoiJOJ3kdQIqQup19ZR5Ap88OuK5oHkAMlBRYAJMdQOqwwi0faR1Arrg4KjdxHUAfK\u002fhtiHEdQNf5t8t+nR5A6bga2ZWWHUCEDOTZ5WsdQN1hE5m5gB5A2SWqtwaWHUDW\u002fPhLi4odQNZXVwVqYR1AODC5UWQNH0CFP8ObNWgeQKPnFroSUR5Au\u002fHuyFgdHkBqaAOwAUEeQG7dzVMdQh5AQ+IeSx96HUA="},"type":"scatter3d"}], {"template":{"data":{"histogram2dcontour":[{"type":"histogram2dcontour","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"choropleth":[{"type":"choropleth","colorbar":{"outlinewidth":0,"ticks":""}}],"histogram2d":[{"type":"histogram2d","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"heatmap":[{"type":"heatmap","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"contourcarpet":[{"type":"contourcarpet","colorbar":{"outlinewidth":0,"ticks":""}}],"contour":[{"type":"contour","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"surface":[{"type":"surface","colorbar":{"outlinewidth":0,"ticks":""},"colorscale":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]]}],"mesh3d":[{"type":"mesh3d","colorbar":{"outlinewidth":0,"ticks":""}}],"scatter":[{"fillpattern":{"fillmode":"overlay","size":10,"solidity":0.2},"type":"scatter"}],"parcoords":[{"type":"parcoords","line":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scatterpolargl":[{"type":"scatterpolargl","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"bar":[{"error_x":{"color":"#2a3f5f"},"error_y":{"color":"#2a3f5f"},"marker":{"line":{"color":"#E5ECF6","width":0.5},"pattern":{"fillmode":"overlay","size":10,"solidity":0.2}},"type":"bar"}],"scattergeo":[{"type":"scattergeo","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scatterpolar":[{"type":"scatterpolar","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"histogram":[{"marker":{"pattern":{"fillmode":"overlay","size":10,"solidity":0.2}},"type":"histogram"}],"scattergl":[{"type":"scattergl","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scatter3d":[{"type":"scatter3d","line":{"colorbar":{"outlinewidth":0,"ticks":""}},"marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scattermap":[{"type":"scattermap","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scattermapbox":[{"type":"scattermapbox","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scatterternary":[{"type":"scatterternary","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"scattercarpet":[{"type":"scattercarpet","marker":{"colorbar":{"outlinewidth":0,"ticks":""}}}],"carpet":[{"aaxis":{"endlinecolor":"#2a3f5f","gridcolor":"white","linecolor":"white","minorgridcolor":"white","startlinecolor":"#2a3f5f"},"baxis":{"endlinecolor":"#2a3f5f","gridcolor":"white","linecolor":"white","minorgridcolor":"white","startlinecolor":"#2a3f5f"},"type":"carpet"}],"table":[{"cells":{"fill":{"color":"#EBF0F8"},"line":{"color":"white"}},"header":{"fill":{"color":"#C8D4E3"},"line":{"color":"white"}},"type":"table"}],"barpolar":[{"marker":{"line":{"color":"#E5ECF6","width":0.5},"pattern":{"fillmode":"overlay","size":10,"solidity":0.2}},"type":"barpolar"}],"pie":[{"automargin":true,"type":"pie"}]},"layout":{"autotypenumbers":"strict","colorway":["#636efa","#EF553B","#00cc96","#ab63fa","#FFA15A","#19d3f3","#FF6692","#B6E880","#FF97FF","#FECB52"],"font":{"color":"#2a3f5f"},"hovermode":"closest","hoverlabel":{"align":"left"},"paper_bgcolor":"white","plot_bgcolor":"#E5ECF6","polar":{"bgcolor":"#E5ECF6","angularaxis":{"gridcolor":"white","linecolor":"white","ticks":""},"radialaxis":{"gridcolor":"white","linecolor":"white","ticks":""}},"ternary":{"bgcolor":"#E5ECF6","aaxis":{"gridcolor":"white","linecolor":"white","ticks":""},"baxis":{"gridcolor":"white","linecolor":"white","ticks":""},"caxis":{"gridcolor":"white","linecolor":"white","ticks":""}},"coloraxis":{"colorbar":{"outlinewidth":0,"ticks":""}},"colorscale":{"sequential":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]],"sequentialminus":[[0.0,"#0d0887"],[0.1111111111111111,"#46039f"],[0.2222222222222222,"#7201a8"],[0.3333333333333333,"#9c179e"],[0.4444444444444444,"#bd3786"],[0.5555555555555556,"#d8576b"],[0.6666666666666666,"#ed7953"],[0.7777777777777778,"#fb9f3a"],[0.8888888888888888,"#fdca26"],[1.0,"#f0f921"]],"diverging":[[0,"#8e0152"],[0.1,"#c51b7d"],[0.2,"#de77ae"],[0.3,"#f1b6da"],[0.4,"#fde0ef"],[0.5,"#f7f7f7"],[0.6,"#e6f5d0"],[0.7,"#b8e186"],[0.8,"#7fbc41"],[0.9,"#4d9221"],[1,"#276419"]]},"xaxis":{"gridcolor":"white","linecolor":"white","ticks":"","title":{"standoff":15},"zerolinecolor":"white","automargin":true,"zerolinewidth":2},"yaxis":{"gridcolor":"white","linecolor":"white","ticks":"","title":{"standoff":15},"zerolinecolor":"white","automargin":true,"zerolinewidth":2},"scene":{"xaxis":{"backgroundcolor":"#E5ECF6","gridcolor":"white","linecolor":"white","showbackground":true,"ticks":"","zerolinecolor":"white","gridwidth":2},"yaxis":{"backgroundcolor":"#E5ECF6","gridcolor":"white","linecolor":"white","showbackground":true,"ticks":"","zerolinecolor":"white","gridwidth":2},"zaxis":{"backgroundcolor":"#E5ECF6","gridcolor":"white","linecolor":"white","showbackground":true,"ticks":"","zerolinecolor":"white","gridwidth":2}},"shapedefaults":{"line":{"color":"#2a3f5f"}},"annotationdefaults":{"arrowcolor":"#2a3f5f","arrowhead":0,"arrowwidth":1},"geo":{"bgcolor":"white","landcolor":"#E5ECF6","subunitcolor":"white","showland":true,"showlakes":true,"lakecolor":"white"},"title":{"x":0.05},"mapbox":{"style":"light"}}},"title":{"font":{"size":16,"color":"white"},"text":"Qwen3.6-35B-A3B - KLD vs PPL vs Size"},"scene":{"xaxis":{"title":{"font":{"color":"#228833","size":12},"text":"Size (GiB) → lower is better"},"type":"linear","gridcolor":"rgba(255,255,255,0.08)","zerolinecolor":"rgba(255,255,255,0.08)","showbackground":true,"backgroundcolor":"#1a1a2e"},"yaxis":{"title":{"font":{"color":"#4477AA","size":12},"text":"KLD (log) → lower is better"},"type":"log","gridcolor":"rgba(255,255,255,0.08)","zerolinecolor":"rgba(255,255,255,0.08)","showbackground":true,"backgroundcolor":"#1a1a2e"},"zaxis":{"title":{"font":{"color":"#EE6677","size":12},"text":"PPL (log) → lower is better"},"type":"log","gridcolor":"rgba(255,255,255,0.08)","zerolinecolor":"rgba(255,255,255,0.08)","showbackground":true,"backgroundcolor":"#1a1a2e"},"camera":{"eye":{"x":1.5,"y":1.5,"z":1.2}},"bgcolor":"#1a1a2e"},"font":{"color":"white"},"legend":{"font":{"size":11,"color":"white"},"bgcolor":"rgba(0,0,0,0.6)","bordercolor":"#444","borderwidth":1,"itemsizing":"constant"},"paper_bgcolor":"#1a1a2e","plot_bgcolor":"#1a1a2e","width":1200,"height":900}, {"responsive": true} ) }; </script> </div>
6
+ </body>
7
+ </html>
Qwen3.6-35B-A3B-logits.bin.meta ADDED
@@ -0,0 +1 @@
 
 
1
+ {"dataset": "C:\\Users\\Windows\\Desktop\\backup\\eval_dataset_260428-0143.txt", "dataset_size": 299472}
Qwen3.6-35B-A3B.log ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ # kld-sweep log - Qwen3.6-35B-A3B
2
+
3
+ - [SKIP] Thireus_4.0579bpw - already in results
4
+ - [SKIP] Thireus_4.5077bpw - already in results
5
+ - [SKIP] Thireus_4.8273bpw - already in results
6
+ - [SKIP] Thireus_5.1174bpw - already in results
7
+ - [SKIP] Thireus_5.5079bpw - already in results
8
+ - [SKIP] Thireus_5.7548bpw - already in results
9
+ - [SKIP] Thireus_6.0569bpw - already in results
10
+ - [SKIP] Thireus_6.7626bpw - already in results
Qwen3.6-35B-A3B_report.md ADDED
@@ -0,0 +1,93 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # KLD-Sweep Report - Qwen3.6-35B-A3B
2
+
3
+ MDL_norm = Size_GiB x 8 + log2(PPL) [bits/token, amortised over 1B tokens]
4
+
5
+ ## Results (sorted by MDL_norm)
6
+
7
+ | Rank | Quantization | Size (GiB) | BPW | PPL | KLD | KLD 99.9% | MDL_norm |
8
+ |------|--------------|------------|-----|-----|-----|-----------|----------|
9
+ | 1 | mudler_APEX-I-Mini | 13.333 | 3.302 | 7.7776 | 0.087271 | 3.065409 | 109.623 |
10
+ | 2 | mudler_APEX-I-Compact | 16.105 | 3.989 | 7.4799 | 0.043432 | 1.820640 | 131.743 |
11
+ | 3 | mudler_APEX-Compact | 16.105 | 3.989 | 7.6257 | 0.062095 | 2.529670 | 131.771 |
12
+ | 4 | Thireus_4.0579bpw | 16.384 | 4.058 | 7.7631 | 0.066857 | 2.273288 | 134.029 |
13
+ | 5 | AesSedai_IQ4_XS | 16.405 | 4.063 | 7.5700 | 0.035996 | 1.669282 | 134.160 |
14
+ | 6 | unsloth_UD-IQ4_XS | 16.513 | 4.090 | 7.5991 | 0.036342 | 1.619864 | 135.030 |
15
+ | 7 | unsloth_UD-IQ4_NL | 16.802 | 4.161 | 7.6022 | 0.036445 | 1.898526 | 137.342 |
16
+ | 8 | mradermacher_i1-IQ4_XS | 17.443 | 4.320 | 7.4260 | 0.035131 | 1.520988 | 142.437 |
17
+ | 9 | batiai_IQ4_XS | 17.443 | 4.320 | 7.4511 | 0.036061 | 1.912124 | 142.441 |
18
+ | 10 | bartowski_IQ4_XS | 17.515 | 4.338 | 7.4094 | 0.032072 | 1.813745 | 143.009 |
19
+ | 11 | unsloth_UD-IQ4_NL_XL | 18.161 | 4.498 | 7.4770 | 0.025694 | 1.354680 | 148.190 |
20
+ | 12 | Thireus_4.5077bpw | 18.262 | 4.523 | 7.6018 | 0.046067 | 1.014056 | 149.022 |
21
+ | 13 | sphaela_Q4_0 | 18.361 | 4.548 | 7.4595 | 0.062128 | 3.098408 | 149.787 |
22
+ | 14 | 0xSero_Q4_0 | 18.361 | 4.548 | 7.4866 | 0.068531 | 3.092771 | 149.792 |
23
+ | 15 | sphaela_Q4_K_M | 18.361 | 4.548 | 7.5156 | 0.038733 | 1.833427 | 149.798 |
24
+ | 16 | sphaela_Q4_K_S | 18.361 | 4.548 | 7.5156 | 0.038733 | 1.833427 | 149.798 |
25
+ | 17 | mradermacher_i1-Q4_0 | 18.440 | 4.567 | 7.4737 | 0.059360 | 3.349420 | 150.422 |
26
+ | 18 | bartowski_IQ4_NL | 18.497 | 4.582 | 7.4112 | 0.031247 | 1.591901 | 150.866 |
27
+ | 19 | mradermacher_i1-Q4_K_S | 18.524 | 4.588 | 7.4998 | 0.035967 | 1.891432 | 151.099 |
28
+ | 20 | worthdoing_Q4_K_S | 18.524 | 4.588 | 7.7884 | 0.068062 | 3.560123 | 151.153 |
29
+ | 21 | bartowski_Q4_0 | 18.573 | 4.600 | 7.3794 | 0.040132 | 2.292114 | 151.467 |
30
+ | 22 | 0xSero_IQ4_NL | 18.578 | 4.602 | 7.4506 | 0.047391 | 2.141885 | 151.521 |
31
+ | 23 | MXFP4_MOE | 18.875 | 4.675 | 7.3723 | 0.037835 | 1.747079 | 153.882 |
32
+ | 24 | 0xSero_DYNAMIC | 19.075 | 4.725 | 7.4837 | 0.042753 | 2.160737 | 155.504 |
33
+ | 25 | bartowski_Q4_K_S | 19.178 | 4.750 | 7.4696 | 0.027690 | 1.507139 | 156.325 |
34
+ | 26 | unsloth_UD-Q4_K_S | 19.458 | 4.820 | 7.4220 | 0.020062 | 1.255272 | 158.556 |
35
+ | 27 | Thireus_4.8273bpw | 19.551 | 4.843 | 7.5792 | 0.043324 | 0.879808 | 159.330 |
36
+ | 28 | mradermacher_i1-Q4_K_M | 19.713 | 4.883 | 7.4637 | 0.031677 | 1.500736 | 160.604 |
37
+ | 29 | batiai_Q4_K_M | 19.713 | 4.883 | 7.4642 | 0.031505 | 1.606371 | 160.604 |
38
+ | 30 | lmstudio_Q4_K_M | 19.713 | 4.883 | 7.6538 | 0.055895 | 2.917688 | 160.640 |
39
+ | 31 | 0xSero_Q4_K_M | 19.713 | 4.883 | 7.6538 | 0.055895 | 2.917688 | 160.640 |
40
+ | 32 | worthdoing_Q4_K_M | 19.713 | 4.883 | 7.6606 | 0.056077 | 2.750742 | 160.641 |
41
+ | 33 | bartowski_Q4_K_M | 19.922 | 4.935 | 7.4335 | 0.025066 | 1.385922 | 162.270 |
42
+ | 34 | steampunque_Q4_K_H | 19.925 | 4.935 | 7.5384 | 0.041208 | 2.585083 | 162.314 |
43
+ | 35 | unsloth_MXFP4_MOE | 20.215 | 5.007 | 7.3468 | 0.026420 | 1.186455 | 164.597 |
44
+ | 36 | bartowski_Q4_K_L | 20.274 | 5.022 | 7.3952 | 0.022723 | 1.161044 | 165.079 |
45
+ | 37 | sphaela_Q4_1 | 20.348 | 5.040 | 7.5230 | 0.082678 | 3.324150 | 165.695 |
46
+ | 38 | mradermacher_i1-Q4_1 | 20.348 | 5.040 | 7.5298 | 0.038358 | 2.079206 | 165.697 |
47
+ | 39 | bartowski_Q4_1 | 20.465 | 5.069 | 7.4388 | 0.030026 | 1.434557 | 166.615 |
48
+ | 40 | unsloth_UD-Q4_K_M | 20.614 | 5.106 | 7.4003 | 0.016585 | 0.791560 | 167.800 |
49
+ | 41 | AesSedai_Q4_K_M | 20.624 | 5.109 | 7.3671 | 0.016405 | 0.962259 | 167.873 |
50
+ | 42 | Thireus_5.1174bpw | 20.659 | 5.117 | 7.5287 | 0.041167 | 0.928671 | 168.184 |
51
+ | 43 | unsloth_UD-Q4_K_XL | 20.825 | 5.158 | 7.3936 | 0.016808 | 1.070779 | 169.486 |
52
+ | 44 | mudler_APEX-I-Quality | 21.252 | 5.264 | 7.3348 | 0.017030 | 1.277997 | 172.891 |
53
+ | 45 | mudler_APEX-Quality | 21.252 | 5.264 | 7.3965 | 0.018793 | 1.241888 | 172.903 |
54
+ | 46 | Thireus_5.5079bpw | 22.235 | 5.508 | 7.5635 | 0.039310 | 0.820752 | 180.799 |
55
+ | 47 | mradermacher_i1-Q5_K_S | 22.334 | 5.533 | 7.3590 | 0.020913 | 1.305873 | 181.552 |
56
+ | 48 | worthdoing_Q5_K_S | 22.334 | 5.533 | 7.4318 | 0.027020 | 1.514734 | 181.566 |
57
+ | 49 | sphaela_Q5_0 | 22.334 | 5.533 | 7.4779 | 0.030836 | 2.128659 | 181.575 |
58
+ | 50 | sphaela_Q5_K_M | 22.334 | 5.533 | 7.7613 | 0.063122 | 2.978244 | 181.628 |
59
+ | 51 | sphaela_Q5_K_S | 22.334 | 5.533 | 7.7613 | 0.063122 | 2.978244 | 181.628 |
60
+ | 52 | bartowski_Q5_K_S | 22.497 | 5.573 | 7.3770 | 0.016080 | 0.877640 | 182.859 |
61
+ | 53 | mradermacher_i1-Q5_K_M | 23.031 | 5.705 | 7.3551 | 0.020523 | 1.355754 | 187.127 |
62
+ | 54 | batiai_Q5_K_M | 23.031 | 5.705 | 7.3827 | 0.018182 | 1.007116 | 187.132 |
63
+ | 55 | worthdoing_Q5_K_M | 23.031 | 5.705 | 7.4204 | 0.025840 | 1.453986 | 187.139 |
64
+ | 56 | 0xSero_Q5_K_M | 23.031 | 5.705 | 7.4258 | 0.026154 | 1.687057 | 187.141 |
65
+ | 57 | unsloth_UD-Q5_K_S | 23.229 | 5.754 | 7.3434 | 0.012991 | 0.971944 | 188.708 |
66
+ | 58 | Thireus_5.7548bpw | 23.231 | 5.755 | 7.5646 | 0.038382 | 0.957410 | 188.767 |
67
+ | 59 | bartowski_Q5_K_M | 23.299 | 5.772 | 7.3819 | 0.014800 | 0.816861 | 189.276 |
68
+ | 60 | bartowski_Q5_K_L | 23.592 | 5.844 | 7.3517 | 0.014274 | 1.021982 | 191.614 |
69
+ | 61 | mudler_APEX-I-Balanced | 23.865 | 5.912 | 7.3451 | 0.015009 | 1.151828 | 193.797 |
70
+ | 62 | mudler_APEX-Balanced | 23.865 | 5.912 | 7.3853 | 0.016136 | 0.978521 | 193.805 |
71
+ | 63 | sphaela_Q5_1 | 24.321 | 6.025 | 7.3615 | 0.033787 | 2.046225 | 197.448 |
72
+ | 64 | Thireus_6.0569bpw | 24.450 | 6.057 | 7.3701 | 0.010921 | 0.621259 | 198.482 |
73
+ | 65 | AesSedai_Q5_K_M | 24.452 | 6.057 | 7.3560 | 0.011521 | 0.808359 | 198.495 |
74
+ | 66 | unsloth_UD-Q5_K_M | 24.639 | 6.104 | 7.3397 | 0.011592 | 0.777676 | 199.988 |
75
+ | 67 | unsloth_UD-Q5_K_XL | 24.766 | 6.135 | 7.3527 | 0.011761 | 0.770376 | 201.006 |
76
+ | 68 | mradermacher_i1-Q6_K | 26.556 | 6.579 | 7.3649 | 0.013445 | 1.010739 | 215.329 |
77
+ | 69 | batiai_Q6_K | 26.556 | 6.579 | 7.3888 | 0.014525 | 0.874168 | 215.333 |
78
+ | 70 | 0xSero_Q6_K | 26.556 | 6.579 | 7.3970 | 0.014817 | 0.819281 | 215.335 |
79
+ | 71 | lmstudio_Q6_K | 26.556 | 6.579 | 7.3971 | 0.014816 | 0.819281 | 215.335 |
80
+ | 72 | AesSedai_Q6_K | 27.108 | 6.716 | 7.3691 | 0.010935 | 0.785779 | 219.745 |
81
+ | 73 | unsloth_UD-Q6_K | 27.296 | 6.762 | 7.3622 | 0.010109 | 0.751166 | 221.248 |
82
+ | 74 | Thireus_6.7626bpw | 27.298 | 6.763 | 7.3693 | 0.010479 | 0.699136 | 221.266 |
83
+ | 75 | bartowski_Q6_K | 27.989 | 6.934 | 7.3830 | 0.010854 | 0.731767 | 226.796 |
84
+ | 76 | bartowski_Q6_K_L | 28.219 | 6.991 | 7.3683 | 0.010529 | 0.764405 | 228.633 |
85
+ | 77 | unsloth_UD-Q6_K_XL | 29.657 | 7.347 | 7.3781 | 0.009570 | 0.658147 | 240.139 |
86
+ | 78 | sphaela_Q8_0 | 34.369 | 8.515 | 7.3491 | 0.009761 | 0.676150 | 277.830 |
87
+ | 79 | 0xSero_Q8_0 | 34.369 | 8.515 | 7.3553 | 0.009181 | 0.640894 | 277.831 |
88
+ | 80 | lmstudio_Q8_0 | 34.369 | 8.515 | 7.3554 | 0.009182 | 0.640894 | 277.831 |
89
+ | 81 | unsloth_Q8_0 | 34.369 | 8.515 | 7.3606 | 0.009532 | 0.783307 | 277.832 |
90
+ | 82 | batiai_Q8_0 | 34.369 | 8.515 | 7.3624 | 0.009635 | 0.875084 | 277.832 |
91
+ | 83 | worthdoing_Q8_0 | 34.369 | 8.515 | 7.3633 | 0.009321 | 0.691923 | 277.832 |
92
+ | 84 | bartowski_Q8_0 | 34.379 | 8.518 | 7.3544 | 0.009451 | 0.733638 | 277.911 |
93
+ | 85 | unsloth_UD-Q8_K_XL | 35.810 | 8.872 | 7.3609 | 0.009616 | 0.747915 | 289.360 |
Qwen3.6-35B-A3B_results.csv ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Quantization,Size_GiB,PPL_Score,KLD_Score,MDL_norm,Num_Tokens,KLD_99,BPW
2
+ mradermacher_i1-IQ4_XS,17.443,7.426015,0.035131,142.43658822933267,72192,1.520988,4.320
3
+ mradermacher_i1-Q4_0,18.44,7.473715,0.059360,150.42182554954604,72192,3.349420,4.567
4
+ mradermacher_i1-Q4_K_S,18.524,7.499771,0.035967,151.09884654464742,72192,1.891432,4.588
5
+ mradermacher_i1-Q4_K_M,19.713,7.463653,0.031677,160.603881914001,72192,1.500736,4.883
6
+ mradermacher_i1-Q4_1,20.348,7.529849,0.038358,165.6966209340691,72192,2.079206,5.040
7
+ mradermacher_i1-Q5_K_S,22.334,7.359026,0.020913,181.55151483177727,72192,1.305873,5.533
8
+ mradermacher_i1-Q5_K_M,23.031,7.355089,0.020523,187.12674279886716,72192,1.355754,5.705
9
+ mradermacher_i1-Q6_K,26.556,7.364891,0.013445,215.3286641736083,72192,1.010739,6.579
10
+ batiai_IQ4_XS,17.443,7.451128,0.036061,142.44145884662444,72192,1.912124,4.320
11
+ batiai_Q4_K_M,19.713,7.464193,0.031505,160.60398629012096,72192,1.606371,4.883
12
+ batiai_Q5_K_M,23.031,7.382705,0.018182,187.13214951209437,72192,1.007116,5.705
13
+ batiai_Q6_K,26.556,7.388789,0.014525,215.33333793042567,72192,0.874168,6.579
14
+ batiai_Q8_0,34.369,7.362404,0.009635,277.8321769174488,72192,0.875084,8.515
15
+ sphaela_Q4_0,18.361,7.459525,0.062128,149.7870837669467,72192,3.098408,4.548
16
+ sphaela_Q4_K_M,18.361,7.515641,0.038733,149.79789615511754,72192,1.833427,4.548
17
+ sphaela_Q4_K_S,18.361,7.515641,0.038733,149.79789615511754,72192,1.833427,4.548
18
+ 0xSero_Q4_0,18.361,7.486566,0.068531,149.79230412311435,72192,3.092771,4.548
19
+ worthdoing_Q4_K_S,18.524,7.788397,0.068062,151.15332642480467,72192,3.560123,4.588
20
+ 0xSero_IQ4_NL,18.578,7.450601,0.047391,151.5213568047356,72192,2.141885,4.602
21
+ MXFP4_MOE,18.875,7.372258,0.037835,153.8821065604976,72192,1.747079,4.675
22
+ 0xSero_DYNAMIC,19.075,7.483691,0.042753,155.50374999123892,72192,2.160737,4.725
23
+ 0xSero_Q4_K_M,19.713,7.653804,0.055895,160.64017695668338,72192,2.917688,4.883
24
+ worthdoing_Q4_K_M,19.713,7.660640,0.056077,160.64146492560403,72192,2.750742,4.883
25
+ steampunque_Q4_K_H,19.925,7.538357,0.041208,162.31425011948275,72192,2.585083,4.935
26
+ sphaela_Q4_1,20.348,7.522974,0.082678,165.69530310430446,72192,3.324150,5.040
27
+ sphaela_Q5_0,22.334,7.477889,0.030836,181.57463105633408,72192,2.128659,5.533
28
+ sphaela_Q5_K_M,22.334,7.761252,0.063122,181.62828939835262,72192,2.978244,5.533
29
+ sphaela_Q5_K_S,22.334,7.761252,0.063122,181.62828939835262,72192,2.978244,5.533
30
+ worthdoing_Q5_K_S,22.334,7.431824,0.027020,181.56571633630966,72192,1.514734,5.533
31
+ 0xSero_Q5_K_M,23.031,7.425827,0.026154,187.14055170501902,72192,1.687057,5.705
32
+ worthdoing_Q5_K_M,23.031,7.420394,0.025840,187.13949579153004,72192,1.453986,5.705
33
+ sphaela_Q5_1,24.321,7.361528,0.033787,197.4480052512312,72192,2.046225,6.025
34
+ 0xSero_Q6_K,26.556,7.397018,0.014817,215.3349437864628,72192,0.819281,6.579
35
+ sphaela_Q8_0,34.369,7.349076,0.009761,277.8295628711712,72192,0.676150,8.515
36
+ 0xSero_Q8_0,34.369,7.355320,0.009181,277.8307881086277,72192,0.640894,8.515
37
+ worthdoing_Q8_0,34.369,7.363255,0.009321,277.83234366495816,72192,0.691923,8.515
38
+ AesSedai_IQ4_XS,16.405,7.570040,0.035996,134.16030092341435,72192,1.669282,4.063
39
+ AesSedai_Q4_K_M,20.624,7.367143,0.016405,167.87310524634236,72192,0.962259,5.109
40
+ AesSedai_Q5_K_M,24.452,7.355996,0.011521,198.4949206952499,72192,0.808359,6.057
41
+ AesSedai_Q6_K,27.108,7.369134,0.010935,219.7454950877988,72192,0.785779,6.716
42
+ bartowski_IQ4_XS,17.515,7.409366,0.032072,143.0093501001846,72192,1.813745,4.338
43
+ bartowski_IQ4_NL,18.497,7.411187,0.031247,150.86570462780347,72192,1.591901,4.582
44
+ bartowski_Q4_0,18.573,7.379371,0.040132,151.46749784963876,72192,2.292114,4.600
45
+ bartowski_Q4_K_S,19.178,7.469551,0.027690,156.32502152420034,72192,1.507139,4.750
46
+ bartowski_Q4_K_M,19.922,7.433477,0.025066,162.27003718752047,72192,1.385922,4.935
47
+ bartowski_Q4_K_L,20.274,7.395230,0.022723,165.07859501746626,72192,1.161044,5.022
48
+ bartowski_Q4_1,20.465,7.438778,0.030026,166.615065643089,72192,1.434557,5.069
49
+ bartowski_Q5_K_S,22.497,7.377050,0.016080,182.8590440139536,72192,0.877640,5.573
50
+ bartowski_Q5_K_M,23.299,7.381860,0.014800,189.2759843765403,72192,0.816861,5.772
51
+ bartowski_Q5_K_L,23.592,7.351717,0.014274,191.61408123200306,72192,1.021982,5.844
52
+ bartowski_Q6_K,27.989,7.383049,0.010854,226.7962167334627,72192,0.731767,6.934
53
+ bartowski_Q6_K_L,28.219,7.368314,0.010529,228.63333454305118,72192,0.764405,6.991
54
+ bartowski_Q8_0,34.379,7.354382,0.009451,277.9106041146963,72192,0.733638,8.518
55
+ unsloth_UD-IQ4_XS,16.513,7.599112,0.036342,135.02983084118173,72192,1.619864,4.090
56
+ unsloth_UD-IQ4_NL,16.802,7.602229,0.036445,137.3424224837882,72192,1.898526,4.161
57
+ unsloth_UD-IQ4_NL_XL,18.161,7.476980,0.025694,148.1904556740163,72192,1.354680,4.498
58
+ unsloth_UD-Q4_K_S,19.458,7.422022,0.020062,158.5558122774089,72192,1.255272,4.820
59
+ unsloth_MXFP4_MOE,20.215,7.346848,0.026420,164.5971254268056,72192,1.186455,5.007
60
+ unsloth_UD-Q4_K_M,20.614,7.400288,0.016585,167.79958141778033,72192,0.791560,5.106
61
+ unsloth_UD-Q4_K_XL,20.825,7.393556,0.016808,169.4862684089794,72192,1.070779,5.158
62
+ unsloth_UD-Q5_K_S,23.229,7.343419,0.012991,188.7084519194575,72192,0.971944,5.754
63
+ unsloth_UD-Q5_K_M,24.639,7.339658,0.011592,199.98771284056178,72192,0.777676,6.104
64
+ unsloth_UD-Q5_K_XL,24.766,7.352658,0.011761,201.0062658812704,72192,0.770376,6.135
65
+ unsloth_UD-Q6_K,27.296,7.362207,0.010109,221.2481383139267,72192,0.751166,6.762
66
+ unsloth_UD-Q6_K_XL,29.657,7.378086,0.009570,240.13924660538547,72192,0.658147,7.347
67
+ unsloth_Q8_0,34.369,7.360562,0.009532,277.83181592438814,72192,0.783307,8.515
68
+ unsloth_UD-Q8_K_XL,35.81,7.360872,0.009616,289.3598766841569,72192,0.747915,8.872
69
+ lmstudio_Q4_K_M,19.713,7.653804,0.055895,160.64017695668338,72192,2.917688,4.883
70
+ lmstudio_Q6_K,26.556,7.397056,0.014816,215.33495119786434,72192,0.819281,6.579
71
+ lmstudio_Q8_0,34.369,7.355369,0.009182,277.83079771960604,72192,0.640894,8.515
72
+ mudler_APEX-I-Mini,13.333,7.777609,0.087271,109.6233267086806,72192,3.065409,3.302
73
+ mudler_APEX-Compact,16.105,7.625708,0.062095,131.7708712891263,72192,2.529670,3.989
74
+ mudler_APEX-I-Compact,16.105,7.479947,0.043432,131.74302804777227,72192,1.820640,3.989
75
+ mudler_APEX-Quality,21.252,7.396510,0.018793,172.90284470406928,72192,1.241888,5.264
76
+ mudler_APEX-I-Quality,21.252,7.334849,0.017030,172.89076726594044,72192,1.277997,5.264
77
+ mudler_APEX-Balanced,23.865,7.385297,0.016136,193.80465594019267,72192,0.978521,5.912
78
+ mudler_APEX-I-Balanced,23.865,7.345131,0.015009,193.79678822139624,72192,1.151828,5.912
79
+ Thireus_4.0579bpw,16.384,7.763078,0.066857,134.02862878319652,72192,2.273288,4.058
80
+ Thireus_4.5077bpw,18.262,7.601767,0.046067,149.02233480616593,72192,1.014056,4.523
81
+ Thireus_4.8273bpw,19.551,7.579173,0.043324,159.330040437593,72192,0.879808,4.843
82
+ Thireus_5.1174bpw,20.659,7.528659,0.041167,168.18439291584815,72192,0.928671,5.117
83
+ Thireus_5.5079bpw,22.235,7.563483,0.039310,180.7990507515971,72192,0.820752,5.508
84
+ Thireus_5.7548bpw,23.231,7.564565,0.038382,188.76725712270814,72192,0.957410,5.755
85
+ Thireus_6.0569bpw,24.45,7.370104,0.010921,198.48168497742424,72192,0.621259,6.057
86
+ Thireus_6.7626bpw,27.298,7.369260,0.010479,221.2655197552863,72192,0.699136,6.763
notes.txt ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Evaluated on eval_dataset_260428-0143.txt 141 chunks, n_ctx=512, batch_size=2048, n_seq=4
2
+
3
+ Windows 11 26200.8246
4
+ Nvidia drivers 596.21
5
+
6
+ ik_llama.cpp
7
+ https://github.com/Thireus/ik_llama.cpp/releases/tag/main-b4660-04d5ead
8
+ Windows x64 (CUDA 12.8) AVX2 - With Libraries
9
+
10
+ ----
11
+
12
+ Perplexity (PPL)
13
+ Measures how surprised the model is by a dataset (prediction quality). Lower is better. It can be converted into bits per token, which is used for MDL.
14
+
15
+ Kullback–Leibler Divergence (KLD)
16
+ Measures how much the probability distribution of outputs changed vs the original FP16 model (faithfulness). Lower is better.
17
+
18
+ Minimum Description Length (MDL)
19
+ Total cost to represent the dataset using the model (efficiency):
20
+ ☝️🤓 Error cost = log₂(PPL) × N ☝️🤓
21
+
22
+ Simply put MDL = Model Cost (bits) + Error Cost (bits) where:
23
+ - Model cost: size of quantized weights (bits)
24
+ - Error cost: extra bits needed due to imperfect predictions (computed from PPL as bits per token) over a lifetime of N tokens (I picked 1 Billion tokens).
25
+
26
+ A quantization scheme optimized for low PPL may still shift the probability distribution, causing a higher KLD even if perplexity looks fine (rare but not impossible). So a good quant would have both a low MDL (efficient) and a low KLD (faithful).
27
+
28
+ Points on the frontier are "Pareto-optimal", no other quant in the dataset beats them on both axes simultaneously. Others are either larger, less faithful, or both.
29
+ Choose a point on this line based on your VRAM and how much fidelity you want.
30
+
31
+ There is no single "best" quant, the right choice depends on whether you prioritize efficiency or fidelity.
32
+
33
+ Note: MDL ranking is context-dependent that's why I share my pseudo-randomly generated dataset for reproducibility (141 chunks at -c 512 generated from eaddario/imatrix-calibration on HF).
34
+
35
+ ----
36
+
37
+ download script
38
+
39
+ mkdir ~/Desktop/backup/models/quants/repo
40
+ cd ~/Desktop/backup/models/quants/repo
41
+ hf download --local-dir . --exclude "*.png" --exclude README.md --exclude .gitattributes --exclude "mmproj*" --exclude "*Q1*.gguf" --exclude "*Q2*.gguf" --exclude "*Q3*.gguf" --exclude "*F16*.gguf" --exclude "*imatrix*" --exclude "*assets*" repo/model-GGUF
42
+
43
+ test script
44
+
45
+ cd C:\Users\Windows\Desktop\backup\references\kld-sweep
46
+ python .\kld_sweep.py --exe C:\Users\Windows\Desktop\backup\ik\llama-perplexity.exe --baseline C:\Users\Windows\Desktop\backup\models\baseline\Qwen_Qwen3.6-35B-A3B-bf16\Qwen_Qwen3.6-35B-A3B-bf16-00001-of-00002.gguf --quants C:\Users\Windows\Desktop\backup\models\quants\ --dataset C:\Users\Windows\Desktop\backup\eval_dataset_260428-0143.txt --output C:\Users\Windows\Desktop\backup\output\ --args="-t 7 -c 512 -ngl 99 -ncmoe 32 --no-mmap" --model-name Qwen3.6-35B-A3B --logit C:\Users\Windows\Desktop\backup\output\Qwen3.6-35B-A3B-logits.bin
47
+
48
+ ----
49
+
50
+ MDL vs Size:
51
+ $ python3 -c "
52
+ import pandas as pd
53
+ import numpy as np
54
+
55
+ df = pd.read_csv('/mnt/c/Users/Windows/Desktop/backup/output/Qwen3.6-35B-A3B_results.csv')
56
+ df = df[df['PPL_Score'] != 'ERROR']
57
+ df['Size_GiB'] = pd.to_numeric(df['Size_GiB'], errors='coerce')
58
+ df['PPL_Score'] = pd.to_numeric(df['PPL_Score'], errors='coerce')
59
+ df['KLD_Score'] = pd.to_numeric(df['KLD_Score'], errors='coerce')
60
+ df['MDL_norm'] = pd.to_numeric(df['MDL_norm'], errors='coerce')
61
+ df = df.dropna(subset=['Size_GiB', 'PPL_Score', 'KLD_Score', 'MDL_norm'])
62
+
63
+ # pearson correlation
64
+ corr = df['Size_GiB'].corr(df['MDL_norm'])
65
+ print(f'Pearson(Size, MDL_norm) = {corr:.6f}')
66
+
67
+ # spearman (rank) correlation
68
+ scorr = df['Size_GiB'].corr(df['MDL_norm'], method='spearman')
69
+ print(f'Spearman(Size, MDL_norm) = {scorr:.6f}')
70
+
71
+ # linear regression r-squared
72
+ from numpy.polynomial.polynomial import polyfit
73
+ b, m = polyfit(df['Size_GiB'].values, df['MDL_norm'].values, 1)
74
+ predicted = b + m * df['Size_GiB'].values
75
+ ss_res = np.sum((df['MDL_norm'].values - predicted) ** 2)
76
+ ss_tot = np.sum((df['MDL_norm'].values - np.mean(df['MDL_norm'].values)) ** 2)
77
+ r2 = 1 - ss_res / ss_totjust paste
78
+ print(f'R²(Size → MDL_norm) = {r2:.6f}')
79
+ print(f'MDL_norm ≈ {m:.3f} × Size + {b:.3f}')
80
+
81
+ # range check
82
+ print(f'Size range: {df[\"Size_GiB\"].min():.1f} - {df[\"Size_GiB\"].max():.1f} GiB')
83
+ print(f'MDL range: {df[\"MDL_norm\"].min():.1f} - {df[\"MDL_norm\"].max():.1f}')
84
+ print(f'PPL range: {df[\"PPL_Score\"].min():.4f} - {df[\"PPL_Score\"].max():.4f}')
85
+ print(f'log2(PPL) range: {np.log2(df[\"PPL_Score\"].min()):.3f} - {np.log2(df[\"PPL_Score\"].max()):.3f}')
86
+ " 2>&1
87
+
88
+ Pearson(Size, MDL_norm) = 1.000000
89
+ Spearman(Size, MDL_norm) = 0.999256
90
+ R²(Size → MDL_norm) = 1.000000
91
+ MDL_norm ≈ 7.998 × Size + 2.942
92
+ Size range: 16.4 - 34.4 GiB
93
+ MDL range: 134.2 - 277.9
94
+ PPL range: 7.3397 - 7.7884
95
+ log2(PPL) range: 2.876 - 2.961
96
+
97
+
98
+ MDL_norm ≈ 8×Size + 2.9 because log2(PPL) is nearly constant across all quants (range 2.88-2.96), so MDL_norm carries not much information beyond size for this model because it's an MoE (with only 8 routed experts out of 256, 8.6% activation ratio). A sparse model like good ol mixtral at 25% would see more variance and a dense model would show much wider PPL.
size_kld_plot_Qwen3.6-35B-A3B.png ADDED

Git LFS Details

  • SHA256: ca408280b062f0213c36da4ed083faed75988ae7a00a2c4c0802ffce2402af32
  • Pointer size: 131 Bytes
  • Size of remote file: 400 kB
size_ppl_plot_Qwen3.6-35B-A3B.png ADDED

Git LFS Details

  • SHA256: 11331ecdc46ee06cdb12497bc43006ac81edfe29e281f2ec7744ae30152b4c7d
  • Pointer size: 131 Bytes
  • Size of remote file: 383 kB