guignome committed on
Commit
b2a12ff
·
verified ·
1 Parent(s): 949cbe1

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -88,11 +88,9 @@
88
  "num_bits": 8,
89
  "observer": null,
90
  "observer_kwargs": {},
91
- "scale_dtype": null,
92
  "strategy": "token",
93
  "symmetric": true,
94
- "type": "float",
95
- "zp_dtype": null
96
  },
97
  "output_activations": null,
98
  "targets": [
@@ -106,11 +104,9 @@
106
  "num_bits": 8,
107
  "observer": "minmax",
108
  "observer_kwargs": {},
109
- "scale_dtype": null,
110
  "strategy": "channel",
111
  "symmetric": true,
112
- "type": "float",
113
- "zp_dtype": null
114
  }
115
  }
116
  },
@@ -164,7 +160,7 @@
164
  "quantization_status": "compressed",
165
  "sparsity_config": {},
166
  "transform_config": {},
167
- "version": "0.13.0"
168
  },
169
  "residual_multiplier": 0.22,
170
  "rms_norm_eps": 1e-05,
@@ -172,8 +168,8 @@
172
  "rope_theta": 10000,
173
  "router_aux_loss_coef": 0.0,
174
  "shared_intermediate_size": 1024,
175
- "tie_word_embeddings": true,
176
- "transformers_version": "4.57.3",
177
  "use_cache": true,
178
  "vocab_size": 100352
179
  }
 
88
  "num_bits": 8,
89
  "observer": null,
90
  "observer_kwargs": {},
 
91
  "strategy": "token",
92
  "symmetric": true,
93
+ "type": "float"
 
94
  },
95
  "output_activations": null,
96
  "targets": [
 
104
  "num_bits": 8,
105
  "observer": "minmax",
106
  "observer_kwargs": {},
 
107
  "strategy": "channel",
108
  "symmetric": true,
109
+ "type": "float"
 
110
  }
111
  }
112
  },
 
160
  "quantization_status": "compressed",
161
  "sparsity_config": {},
162
  "transform_config": {},
163
+ "version": "0.12.2"
164
  },
165
  "residual_multiplier": 0.22,
166
  "rms_norm_eps": 1e-05,
 
168
  "rope_theta": 10000,
169
  "router_aux_loss_coef": 0.0,
170
  "shared_intermediate_size": 1024,
171
+ "tie_word_embeddings": false,
172
+ "transformers_version": "4.56.2",
173
  "use_cache": true,
174
  "vocab_size": 100352
175
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 100257,
4
  "eos_token_id": 100257,
5
  "pad_token_id": 100256,
6
- "transformers_version": "4.57.3"
7
  }
 
3
  "bos_token_id": 100257,
4
  "eos_token_id": 100257,
5
  "pad_token_id": 100256,
6
+ "transformers_version": "4.56.2"
7
  }
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc81a91ad74206a8fae5d2cbdef72947522b95e5ddd0ad55094783830851d09f
3
  size 4802288912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd47d73816b8de7d150a694a45faca5776a5d4123dedb1752db7469d28e5b583
3
  size 4802288912
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5227f3ed491c6b2365e38b4c05f0dc81c91a36cf960c675b9a9030febb3dfc0
3
- size 3529213664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8dd18fb7f26fb99a5c14bd9ee4026fe55c3dab8fa6bddfffc588754af3d3946
3
+ size 3837495128
model.safetensors.index.json CHANGED
@@ -1,9 +1,10 @@
1
  {
2
  "metadata": {
3
- "total_parameters": 6939484416,
4
- "total_size": 13138641408
5
  },
6
  "weight_map": {
 
7
  "model.embed_tokens.weight": "model-00001-of-00003.safetensors",
8
  "model.layers.0.block_sparse_moe.input_linear.weight": "model-00001-of-00003.safetensors",
9
  "model.layers.0.block_sparse_moe.output_linear.weight": "model-00001-of-00003.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_parameters": 7093625088,
4
+ "total_size": 13446922752
5
  },
6
  "weight_map": {
7
+ "lm_head.weight": "model-00003-of-00003.safetensors",
8
  "model.embed_tokens.weight": "model-00001-of-00003.safetensors",
9
  "model.layers.0.block_sparse_moe.input_linear.weight": "model-00001-of-00003.safetensors",
10
  "model.layers.0.block_sparse_moe.output_linear.weight": "model-00001-of-00003.safetensors",