deucebucket committed on
Commit
1d8f09d
·
verified ·
1 Parent(s): 12074d3

results: head-to-head — uniform Q3_K_M of same heretic weights, identical harness

Browse files
benchmark_results_uniform/uniform-q3km-heretic-35b_arc_detailed.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
benchmark_results_uniform/uniform-q3km-heretic-35b_arc_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "benchmark": "arc_challenge",
3
+ "model": "uniform-q3km-heretic-35b",
4
+ "accuracy": 95.56,
5
+ "total": 1172,
6
+ "elapsed_seconds": 210.6,
7
+ "timestamp": "2026-06-11 22:19"
8
+ }
benchmark_results_uniform/uniform-q3km-heretic-35b_evalplus_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "benchmark": "evalplus_humaneval_plus",
3
+ "model": "uniform-q3km-heretic-35b",
4
+ "pass_at_1_plus": 57.93,
5
+ "pass_at_1_base": 65.24,
6
+ "total_problems": 164,
7
+ "elapsed_seconds": 235.3,
8
+ "timestamp": "2026-06-11 22:16"
9
+ }
benchmark_results_uniform/uniform-q3km-heretic-35b_evalplus_samples.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
benchmark_results_uniform/uniform-q3km-heretic-35b_evalplus_samples_eval_results.json ADDED
The diff for this file is too large to render. See raw diff
 
benchmark_results_uniform/uniform-q3km-heretic-35b_hellaswag_detailed.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
benchmark_results_uniform/uniform-q3km-heretic-35b_hellaswag_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "benchmark": "hellaswag",
3
+ "model": "uniform-q3km-heretic-35b",
4
+ "accuracy": 91.92,
5
+ "total": 10042,
6
+ "elapsed_seconds": 2336.3,
7
+ "timestamp": "2026-06-11 22:58"
8
+ }
benchmark_results_uniform/uniform-q3km-heretic-35b_mmlu_redux_detailed.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
benchmark_results_uniform/uniform-q3km-heretic-35b_mmlu_redux_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "benchmark": "mmlu_redux",
3
+ "model": "uniform-q3km-heretic-35b",
4
+ "accuracy": 74.88,
5
+ "total": 2400,
6
+ "elapsed_seconds": 487.7,
7
+ "timestamp": "2026-06-11 23:07"
8
+ }