File size: 2,695 Bytes
0585c4e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
{
  "dtype": "int4_int8_int8",
  "input_info": null,
  "optimum_version": "2.1.0.dev0",
  "output_attentions": false,
  "quantization_config": {
    "_dataset_kwargs": {},
    "dataset": null,
    "default_config": null,
    "ignored_scope": null,
    "num_samples": null,
    "processor": "/nfs/ov-share-01/data/cv_bench_cache/NATIVE_GEN-AI_MODELS/qwen3.5-35b-a3b/pytorch/NATIVE",
    "quantization_configs": {
      "lm_model": {
        "_dataset_kwargs": {},
        "all_layers": null,
        "backup_precision": null,
        "bits": 4,
        "dataset": null,
        "dq_group_size": null,
        "dtype": "int4",
        "gptq": null,
        "group_size": 128,
        "group_size_fallback": null,
        "ignored_scope": {
          "patterns": [
            ".*shared_expert.*",
            ".*attn.*"
          ]
        },
        "lora_correction": null,
        "num_samples": null,
        "processor": null,
        "quant_method": "default",
        "ratio": 1.0,
        "scale_estimation": null,
        "sensitivity_metric": null,
        "statistics_path": null,
        "sym": false,
        "tokenizer": null
      },
      "text_embeddings_model": {
        "_dataset_kwargs": {},
        "all_layers": null,
        "backup_precision": null,
        "bits": 8,
        "dataset": null,
        "dq_group_size": null,
        "dtype": "int8",
        "gptq": null,
        "group_size": null,
        "group_size_fallback": null,
        "ignored_scope": null,
        "lora_correction": null,
        "num_samples": null,
        "processor": null,
        "quant_method": "default",
        "ratio": 1.0,
        "scale_estimation": null,
        "sensitivity_metric": null,
        "statistics_path": null,
        "sym": true,
        "tokenizer": null,
        "weight_only": true
      },
      "vision_embeddings_merger_model": {
        "_dataset_kwargs": {},
        "all_layers": null,
        "backup_precision": null,
        "bits": 8,
        "dataset": null,
        "dq_group_size": null,
        "dtype": "int8",
        "gptq": null,
        "group_size": null,
        "group_size_fallback": null,
        "ignored_scope": null,
        "lora_correction": null,
        "num_samples": null,
        "processor": null,
        "quant_method": "default",
        "ratio": 1.0,
        "scale_estimation": null,
        "sensitivity_metric": null,
        "statistics_path": null,
        "sym": true,
        "tokenizer": null,
        "weight_only": true
      }
    },
    "tokenizer": "/nfs/ov-share-01/data/cv_bench_cache/NATIVE_GEN-AI_MODELS/qwen3.5-35b-a3b/pytorch/NATIVE"
  },
  "save_onnx_model": false,
  "transformers_version": "5.2.0"
}