{ "metadata": { "total_parameters": 1485821296, "total_size": 17470903992 }, "weight_map": { "lm_head.weight": "model-00004-of-00004.safetensors", "model.language_model.embed_tokens.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.0.input_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.A_log": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.conv1d.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.dt_bias": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_a.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_a.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_a.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_b.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_b.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_b.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_qkv.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_qkv.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_qkv.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_z.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_z.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.in_proj_z.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.out_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.out_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.linear_attn.out_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.down_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.down_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.down_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.down_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.gate_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.gate_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.gate_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.up_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.up_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert.up_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert_gate.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert_gate.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.0.mlp.shared_expert_gate.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.0.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.1.input_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.A_log": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.conv1d.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.dt_bias": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_a.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_a.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_a.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_b.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_b.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_b.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_qkv.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_qkv.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_qkv.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_z.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_z.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.in_proj_z.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.out_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.out_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.linear_attn.out_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.down_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.down_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.down_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.down_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.gate_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.gate_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.gate_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.up_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.up_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert.up_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert_gate.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert_gate.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.1.mlp.shared_expert_gate.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.1.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.10.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.10.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.10.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.11.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.k_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.k_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.k_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.o_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.o_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.o_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.q_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.q_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.q_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.v_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.v_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.11.self_attn.v_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.12.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.12.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.13.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.13.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.13.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.14.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.14.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.14.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.15.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.k_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.k_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.k_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.o_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.o_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.o_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.q_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.q_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.q_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.v_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.v_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.15.self_attn.v_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.16.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.16.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.17.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.17.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.17.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.18.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.18.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.18.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.19.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.k_norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.k_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.k_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.k_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.o_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.o_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.o_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.q_norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.q_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.q_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.q_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.v_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.v_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.19.self_attn.v_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.2.input_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.A_log": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.conv1d.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.dt_bias": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_a.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_a.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_a.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_b.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_b.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_b.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_qkv.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_qkv.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_qkv.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_z.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_z.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.in_proj_z.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.out_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.out_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.linear_attn.out_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.down_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.down_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.down_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.down_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.gate_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.gate_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.gate_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.up_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.up_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert.up_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert_gate.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert_gate.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.2.mlp.shared_expert_gate.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.2.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.20.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.20.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.20.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.21.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.21.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.21.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.22.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.22.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.22.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.22.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.23.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.k_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.k_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.k_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.o_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.o_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.o_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.q_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.q_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.q_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.v_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.v_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.23.self_attn.v_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.24.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.24.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.25.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.25.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.25.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.26.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.26.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.26.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.27.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.k_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.k_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.k_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.o_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.o_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.o_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.q_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.q_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.q_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.v_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.v_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.27.self_attn.v_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.28.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.28.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.29.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.29.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.29.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.3.input_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.down_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.down_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.down_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.down_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.gate_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.gate_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.gate_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.up_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.up_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert.up_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert_gate.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert_gate.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.mlp.shared_expert_gate.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.k_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.k_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.k_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.o_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.o_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.o_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.q_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.q_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.q_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.v_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.v_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.3.self_attn.v_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.30.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.30.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.30.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.31.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.k_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.k_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.k_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.o_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.o_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.o_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.q_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.q_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.q_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.v_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.v_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.31.self_attn.v_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.32.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.32.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.33.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.33.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.33.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.34.input_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.A_log": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.conv1d.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.dt_bias": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_a.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_a.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_a.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_b.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_b.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_b.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_qkv.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_qkv.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_qkv.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_z.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_z.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.in_proj_z.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.out_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.out_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.linear_attn.out_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.down_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.down_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.down_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.up_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.up_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert.up_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert_gate.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert_gate.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.34.mlp.shared_expert_gate.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.34.post_attention_layernorm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.35.input_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.down_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.0.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.0.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.1.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.1.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.10.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.10.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.100.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.100.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.101.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.101.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.102.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.102.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.103.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.103.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.104.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.104.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.105.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.105.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.106.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.106.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.107.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.107.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.108.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.108.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.109.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.109.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.11.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.11.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.110.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.110.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.111.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.111.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.112.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.112.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.113.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.113.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.114.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.114.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.115.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.115.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.116.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.116.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.117.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.117.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.118.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.118.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.119.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.119.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.12.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.12.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.120.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.120.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.121.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.121.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.122.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.122.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.123.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.123.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.124.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.124.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.125.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.125.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.126.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.126.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.127.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.127.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.128.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.128.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.129.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.129.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.13.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.13.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.130.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.130.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.131.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.131.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.132.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.132.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.133.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.133.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.134.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.134.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.135.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.135.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.136.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.136.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.137.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.137.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.138.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.138.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.139.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.139.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.14.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.14.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.140.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.140.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.141.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.141.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.142.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.142.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.143.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.143.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.144.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.144.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.145.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.145.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.146.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.146.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.147.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.147.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.148.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.148.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.149.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.149.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.15.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.15.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.150.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.150.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.151.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.151.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.152.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.152.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.153.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.153.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.154.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.154.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.155.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.155.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.156.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.156.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.157.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.157.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.158.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.158.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.159.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.159.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.16.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.16.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.160.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.160.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.161.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.161.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.162.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.162.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.163.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.163.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.164.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.164.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.165.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.165.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.166.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.166.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.167.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.167.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.168.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.168.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.169.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.169.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.17.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.17.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.170.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.170.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.171.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.171.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.172.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.172.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.173.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.173.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.174.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.174.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.175.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.175.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.176.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.176.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.177.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.177.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.178.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.178.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.179.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.179.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.18.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.18.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.180.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.180.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.181.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.181.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.182.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.182.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.183.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.183.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.184.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.184.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.185.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.185.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.186.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.186.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.187.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.187.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.188.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.188.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.189.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.189.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.19.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.19.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.190.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.190.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.191.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.191.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.192.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.192.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.193.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.193.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.194.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.194.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.195.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.195.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.196.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.196.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.197.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.197.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.198.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.198.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.199.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.199.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.2.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.2.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.20.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.20.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.200.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.200.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.201.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.201.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.202.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.202.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.203.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.203.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.204.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.204.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.205.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.205.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.206.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.206.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.207.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.207.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.208.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.208.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.209.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.209.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.21.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.21.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.210.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.210.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.211.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.211.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.212.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.212.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.213.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.213.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.214.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.214.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.215.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.215.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.216.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.216.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.217.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.217.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.218.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.218.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.219.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.219.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.22.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.22.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.220.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.220.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.221.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.221.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.222.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.222.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.223.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.223.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.224.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.224.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.225.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.225.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.226.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.226.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.227.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.227.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.228.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.228.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.229.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.229.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.23.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.23.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.230.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.230.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.231.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.231.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.232.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.232.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.233.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.233.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.234.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.234.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.235.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.235.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.236.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.236.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.237.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.237.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.238.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.238.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.239.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.239.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.24.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.24.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.240.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.240.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.241.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.241.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.242.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.242.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.243.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.243.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.244.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.244.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.245.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.245.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.246.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.246.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.247.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.247.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.248.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.248.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.249.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.249.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.25.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.25.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.250.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.250.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.251.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.251.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.252.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.252.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.253.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.253.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.254.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.254.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.255.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.255.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.26.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.26.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.27.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.27.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.28.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.28.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.29.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.29.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.3.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.3.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.30.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.30.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.31.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.31.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.32.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.32.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.33.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.33.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.34.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.34.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.35.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.35.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.36.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.36.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.37.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.37.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.38.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.38.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.39.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.39.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.4.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.4.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.40.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.40.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.41.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.41.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.42.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.42.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.43.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.43.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.44.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.44.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.45.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.45.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.46.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.46.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.47.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.47.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.48.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.48.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.49.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.49.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.5.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.5.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.50.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.50.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.51.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.51.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.52.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.52.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.53.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.53.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.54.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.54.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.55.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.55.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.56.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.56.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.57.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.57.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.58.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.58.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.59.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.59.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.6.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.6.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.60.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.60.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.61.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.61.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.62.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.62.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.63.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.63.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.64.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.64.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.65.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.65.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.66.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.66.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.67.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.67.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.68.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.68.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.69.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.69.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.7.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.7.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.70.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.70.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.71.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.71.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.72.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.72.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.73.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.73.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.74.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.74.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.75.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.75.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.76.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.76.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.77.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.77.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.78.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.78.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.79.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.79.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.8.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.8.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.80.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.80.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.81.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.81.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.82.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.82.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.83.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.83.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.84.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.84.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.85.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.85.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.86.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.86.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.87.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.87.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.88.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.88.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.89.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.89.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.9.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.9.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.90.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.90.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.91.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.91.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.92.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.92.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.93.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.93.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.94.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.94.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.95.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.95.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.96.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.96.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.97.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.97.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.98.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.98.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.99.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.experts.gate_up_proj_list.99.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.gate.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.down_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.down_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.down_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.gate_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.gate_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.gate_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.up_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.up_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert.up_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert_gate.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert_gate.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.35.mlp.shared_expert_gate.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.35.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.35.self_attn.k_norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.k_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.k_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.k_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.o_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.o_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.o_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.q_norm.weight": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.q_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.q_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.q_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.v_proj.W_q_packed": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.v_proj.scale": "model-00003-of-00004.safetensors", "model.language_model.layers.35.self_attn.v_proj.zero": "model-00003-of-00004.safetensors", "model.language_model.layers.36.input_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.A_log": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.conv1d.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.dt_bias": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_a.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_a.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_a.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_b.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_b.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_b.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_qkv.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_qkv.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_qkv.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_z.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_z.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.in_proj_z.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.norm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.out_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.out_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.linear_attn.out_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.0.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.0.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.0.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.1.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.1.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.1.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.10.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.10.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.10.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.100.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.100.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.100.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.101.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.101.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.101.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.102.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.102.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.102.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.103.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.103.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.103.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.104.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.104.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.104.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.105.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.105.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.105.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.106.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.106.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.106.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.107.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.107.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.107.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.108.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.108.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.108.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.109.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.109.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.109.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.11.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.11.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.11.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.110.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.110.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.110.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.111.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.111.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.111.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.112.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.112.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.112.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.113.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.113.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.113.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.114.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.114.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.114.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.115.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.115.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.115.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.116.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.116.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.116.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.117.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.117.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.117.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.118.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.118.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.118.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.119.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.119.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.119.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.12.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.12.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.12.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.120.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.120.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.120.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.121.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.121.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.121.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.122.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.122.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.122.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.123.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.123.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.123.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.124.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.124.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.124.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.125.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.125.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.125.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.126.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.126.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.126.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.127.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.127.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.127.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.128.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.128.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.128.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.129.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.129.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.129.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.13.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.13.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.13.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.130.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.130.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.130.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.131.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.131.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.131.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.132.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.132.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.132.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.133.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.133.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.133.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.134.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.134.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.134.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.135.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.135.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.135.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.136.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.136.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.136.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.137.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.137.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.137.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.138.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.138.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.138.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.139.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.139.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.139.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.14.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.14.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.14.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.140.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.140.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.140.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.141.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.141.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.141.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.142.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.142.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.142.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.143.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.143.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.143.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.144.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.144.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.144.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.145.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.145.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.145.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.146.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.146.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.146.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.147.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.147.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.147.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.148.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.148.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.148.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.149.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.149.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.149.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.15.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.15.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.15.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.150.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.150.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.150.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.151.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.151.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.151.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.152.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.152.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.152.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.153.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.153.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.153.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.154.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.154.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.154.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.155.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.155.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.155.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.156.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.156.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.156.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.157.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.157.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.157.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.158.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.158.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.158.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.159.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.159.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.159.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.16.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.16.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.16.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.160.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.160.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.160.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.161.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.161.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.161.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.162.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.162.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.162.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.163.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.163.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.163.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.164.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.164.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.164.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.165.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.165.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.165.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.166.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.166.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.166.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.167.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.167.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.167.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.168.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.168.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.168.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.169.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.169.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.169.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.17.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.17.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.17.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.170.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.170.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.170.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.171.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.171.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.171.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.172.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.172.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.172.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.173.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.173.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.173.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.174.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.174.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.174.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.175.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.175.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.175.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.176.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.176.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.176.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.177.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.177.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.177.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.178.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.178.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.178.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.179.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.179.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.179.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.18.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.18.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.18.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.180.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.180.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.180.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.181.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.181.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.181.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.182.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.182.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.182.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.183.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.183.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.183.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.184.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.184.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.184.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.185.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.185.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.185.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.186.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.186.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.186.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.187.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.187.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.187.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.188.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.188.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.188.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.189.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.189.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.189.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.19.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.19.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.19.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.190.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.190.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.190.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.191.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.191.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.191.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.192.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.192.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.192.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.193.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.193.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.193.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.194.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.194.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.194.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.195.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.195.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.195.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.196.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.196.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.196.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.197.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.197.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.197.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.198.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.198.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.198.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.199.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.199.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.199.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.2.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.2.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.2.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.20.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.20.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.20.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.200.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.200.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.200.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.201.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.201.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.201.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.202.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.202.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.202.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.203.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.203.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.203.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.204.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.204.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.204.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.205.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.205.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.205.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.206.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.206.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.206.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.207.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.207.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.207.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.208.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.208.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.208.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.209.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.209.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.209.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.21.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.21.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.21.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.210.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.210.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.210.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.211.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.211.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.211.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.212.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.212.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.212.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.213.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.213.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.213.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.214.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.214.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.214.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.215.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.215.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.215.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.216.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.216.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.216.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.217.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.217.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.217.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.218.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.218.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.218.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.219.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.219.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.219.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.22.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.22.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.22.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.220.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.220.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.220.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.221.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.221.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.221.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.222.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.222.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.222.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.223.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.223.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.223.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.224.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.224.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.224.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.225.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.225.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.225.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.226.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.226.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.226.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.227.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.227.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.227.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.228.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.228.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.228.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.229.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.229.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.229.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.23.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.23.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.23.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.230.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.230.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.230.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.231.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.231.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.231.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.232.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.232.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.232.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.233.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.233.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.233.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.234.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.234.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.234.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.235.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.235.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.235.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.236.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.236.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.236.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.237.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.237.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.237.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.238.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.238.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.238.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.239.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.239.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.239.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.24.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.24.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.24.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.240.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.240.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.240.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.241.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.241.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.241.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.242.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.242.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.242.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.243.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.243.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.243.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.244.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.244.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.244.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.245.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.245.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.245.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.246.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.246.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.246.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.247.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.247.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.247.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.248.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.248.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.248.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.249.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.249.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.249.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.25.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.25.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.25.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.250.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.250.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.250.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.251.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.251.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.251.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.252.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.252.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.252.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.253.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.253.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.253.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.254.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.254.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.254.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.255.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.255.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.255.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.26.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.26.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.26.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.27.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.27.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.27.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.28.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.28.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.28.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.29.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.29.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.29.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.3.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.3.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.3.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.30.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.30.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.30.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.31.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.31.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.31.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.32.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.32.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.32.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.33.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.33.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.33.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.34.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.34.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.34.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.35.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.35.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.35.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.36.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.36.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.36.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.37.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.37.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.37.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.38.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.38.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.38.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.39.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.39.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.39.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.4.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.4.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.4.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.40.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.40.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.40.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.41.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.41.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.41.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.42.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.42.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.42.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.43.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.43.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.43.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.44.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.44.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.44.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.45.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.45.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.45.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.46.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.46.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.46.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.47.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.47.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.47.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.48.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.48.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.48.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.49.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.49.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.49.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.5.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.5.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.5.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.50.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.50.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.50.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.51.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.51.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.51.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.52.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.52.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.52.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.53.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.53.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.53.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.54.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.54.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.54.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.55.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.55.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.55.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.56.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.56.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.56.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.57.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.57.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.57.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.58.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.58.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.58.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.59.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.59.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.59.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.6.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.6.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.6.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.60.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.60.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.60.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.61.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.61.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.61.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.62.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.62.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.62.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.63.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.63.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.63.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.64.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.64.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.64.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.65.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.65.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.65.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.66.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.66.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.66.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.67.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.67.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.67.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.68.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.68.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.68.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.69.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.69.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.69.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.7.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.7.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.7.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.70.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.70.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.70.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.71.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.71.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.71.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.72.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.72.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.72.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.73.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.73.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.73.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.74.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.74.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.74.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.75.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.75.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.75.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.76.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.76.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.76.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.77.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.77.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.77.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.78.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.78.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.78.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.79.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.79.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.79.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.8.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.8.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.8.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.80.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.80.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.80.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.81.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.81.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.81.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.82.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.82.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.82.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.83.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.83.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.83.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.84.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.84.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.84.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.85.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.85.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.85.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.86.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.86.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.86.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.87.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.87.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.87.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.88.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.88.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.88.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.89.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.89.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.89.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.9.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.9.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.9.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.90.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.90.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.90.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.91.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.91.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.91.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.92.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.92.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.92.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.93.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.93.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.93.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.94.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.94.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.94.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.95.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.95.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.95.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.96.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.96.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.96.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.97.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.97.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.97.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.98.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.98.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.98.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.99.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.99.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.down_proj_list.99.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.0.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.0.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.1.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.1.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.10.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.10.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.100.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.100.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.101.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.101.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.102.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.102.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.103.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.103.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.104.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.104.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.105.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.105.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.106.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.106.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.107.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.107.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.108.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.108.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.109.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.109.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.11.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.11.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.110.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.110.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.111.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.111.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.112.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.112.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.113.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.113.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.114.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.114.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.115.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.115.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.116.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.116.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.117.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.117.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.118.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.118.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.119.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.119.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.12.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.12.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.120.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.120.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.121.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.121.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.122.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.122.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.123.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.123.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.124.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.124.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.125.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.125.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.126.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.126.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.127.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.127.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.128.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.128.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.129.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.129.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.13.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.13.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.130.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.130.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.131.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.131.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.132.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.132.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.133.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.133.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.134.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.134.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.135.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.135.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.136.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.136.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.137.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.137.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.138.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.138.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.139.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.139.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.14.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.14.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.140.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.140.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.141.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.141.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.142.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.142.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.143.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.143.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.144.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.144.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.145.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.145.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.146.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.146.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.147.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.147.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.148.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.148.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.149.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.149.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.15.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.15.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.150.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.150.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.151.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.151.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.152.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.152.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.153.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.153.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.154.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.154.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.155.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.155.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.156.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.156.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.157.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.157.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.158.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.158.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.159.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.159.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.16.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.16.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.160.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.160.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.161.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.161.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.162.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.162.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.163.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.163.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.164.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.164.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.165.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.165.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.166.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.166.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.167.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.167.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.168.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.168.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.169.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.169.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.17.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.17.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.170.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.170.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.171.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.171.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.172.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.172.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.173.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.173.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.174.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.174.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.175.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.175.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.176.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.176.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.177.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.177.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.178.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.178.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.179.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.179.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.18.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.18.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.180.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.180.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.181.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.181.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.182.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.182.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.183.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.183.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.184.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.184.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.185.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.185.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.186.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.186.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.187.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.187.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.188.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.188.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.189.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.189.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.19.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.19.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.190.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.190.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.191.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.191.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.192.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.192.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.193.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.193.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.194.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.194.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.195.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.195.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.196.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.196.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.197.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.197.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.198.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.198.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.199.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.199.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.2.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.2.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.20.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.20.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.200.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.200.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.201.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.201.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.202.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.202.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.203.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.203.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.204.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.204.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.205.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.205.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.206.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.206.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.207.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.207.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.208.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.208.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.209.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.209.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.21.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.21.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.210.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.210.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.211.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.211.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.212.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.212.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.213.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.213.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.214.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.214.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.215.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.215.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.216.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.216.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.217.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.217.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.218.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.218.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.219.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.219.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.22.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.22.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.220.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.220.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.221.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.221.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.222.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.222.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.223.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.223.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.224.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.224.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.225.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.225.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.226.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.226.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.227.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.227.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.228.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.228.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.229.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.229.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.23.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.23.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.230.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.230.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.231.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.231.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.232.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.232.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.233.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.233.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.234.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.234.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.235.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.235.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.236.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.236.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.237.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.237.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.238.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.238.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.239.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.239.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.24.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.24.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.240.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.240.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.241.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.241.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.242.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.242.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.243.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.243.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.244.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.244.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.245.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.245.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.246.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.246.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.247.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.247.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.248.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.248.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.249.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.249.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.25.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.25.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.250.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.250.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.251.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.251.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.252.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.252.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.253.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.253.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.254.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.254.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.255.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.255.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.26.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.26.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.27.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.27.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.28.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.28.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.29.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.29.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.3.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.3.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.30.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.30.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.31.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.31.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.32.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.32.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.33.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.33.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.34.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.34.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.35.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.35.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.36.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.36.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.37.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.37.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.38.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.38.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.39.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.39.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.4.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.4.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.40.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.40.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.41.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.41.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.42.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.42.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.43.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.43.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.44.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.44.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.45.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.45.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.46.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.46.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.47.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.47.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.48.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.48.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.49.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.49.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.5.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.5.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.50.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.50.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.51.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.51.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.52.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.52.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.53.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.53.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.54.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.54.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.55.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.55.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.56.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.56.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.57.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.57.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.58.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.58.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.59.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.59.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.6.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.6.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.60.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.60.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.61.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.61.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.62.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.62.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.63.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.63.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.64.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.64.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.65.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.65.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.66.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.66.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.67.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.67.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.68.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.68.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.69.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.69.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.7.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.7.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.70.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.70.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.71.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.71.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.72.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.72.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.73.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.73.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.74.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.74.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.75.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.75.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.76.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.76.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.77.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.77.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.78.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.78.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.79.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.79.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.8.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.8.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.80.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.80.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.81.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.81.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.82.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.82.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.83.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.83.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.84.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.84.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.85.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.85.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.86.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.86.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.87.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.87.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.88.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.88.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.89.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.89.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.9.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.9.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.90.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.90.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.91.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.91.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.92.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.92.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.93.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.93.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.94.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.94.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.95.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.95.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.96.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.96.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.97.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.97.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.98.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.98.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.99.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.experts.gate_up_proj_list.99.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.gate.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.down_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.down_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.down_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.gate_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.gate_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.gate_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.up_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.up_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert.up_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert_gate.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert_gate.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.36.mlp.shared_expert_gate.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.36.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.37.input_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.A_log": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.conv1d.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.dt_bias": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_a.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_a.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_a.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_b.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_b.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_b.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_qkv.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_qkv.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_qkv.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_z.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_z.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.in_proj_z.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.norm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.out_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.out_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.linear_attn.out_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.0.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.0.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.0.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.1.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.1.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.1.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.10.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.10.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.10.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.100.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.100.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.100.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.101.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.101.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.101.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.102.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.102.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.102.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.103.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.103.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.103.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.104.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.104.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.104.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.105.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.105.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.105.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.106.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.106.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.106.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.107.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.107.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.107.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.108.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.108.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.108.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.109.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.109.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.109.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.11.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.11.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.11.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.110.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.110.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.110.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.111.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.111.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.111.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.112.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.112.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.112.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.113.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.113.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.113.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.114.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.114.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.114.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.115.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.115.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.115.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.116.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.116.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.116.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.117.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.117.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.117.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.118.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.118.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.118.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.119.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.119.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.119.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.12.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.12.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.12.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.120.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.120.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.120.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.121.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.121.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.121.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.122.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.122.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.122.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.123.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.123.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.123.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.124.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.124.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.124.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.125.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.125.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.125.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.126.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.126.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.126.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.127.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.127.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.127.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.128.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.128.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.128.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.129.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.129.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.129.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.13.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.13.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.13.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.130.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.130.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.130.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.131.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.131.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.131.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.132.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.132.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.132.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.133.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.133.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.133.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.134.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.134.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.134.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.135.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.135.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.135.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.136.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.136.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.136.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.137.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.137.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.137.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.138.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.138.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.138.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.139.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.139.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.139.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.14.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.14.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.14.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.140.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.140.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.140.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.141.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.141.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.141.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.142.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.142.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.142.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.143.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.143.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.143.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.144.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.144.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.144.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.145.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.145.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.145.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.146.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.146.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.146.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.147.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.147.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.147.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.148.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.148.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.148.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.149.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.149.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.149.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.15.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.15.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.15.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.150.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.150.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.150.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.151.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.151.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.151.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.152.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.152.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.152.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.153.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.153.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.153.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.154.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.154.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.154.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.155.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.155.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.155.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.156.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.156.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.156.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.157.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.157.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.157.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.158.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.158.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.158.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.159.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.159.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.159.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.16.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.16.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.16.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.160.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.160.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.160.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.161.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.161.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.161.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.162.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.162.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.162.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.163.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.163.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.163.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.164.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.164.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.164.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.165.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.165.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.165.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.166.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.166.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.166.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.167.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.167.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.167.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.168.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.168.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.168.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.169.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.169.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.169.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.17.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.17.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.17.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.170.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.170.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.170.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.171.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.171.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.171.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.172.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.172.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.172.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.173.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.173.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.173.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.174.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.174.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.174.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.175.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.175.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.175.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.176.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.176.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.176.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.177.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.177.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.177.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.178.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.178.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.178.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.179.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.179.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.179.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.18.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.18.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.18.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.180.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.180.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.180.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.181.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.181.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.181.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.182.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.182.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.182.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.183.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.183.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.183.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.184.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.184.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.184.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.185.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.185.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.185.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.186.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.186.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.186.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.187.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.187.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.187.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.188.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.188.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.188.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.189.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.189.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.189.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.19.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.19.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.19.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.190.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.190.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.190.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.191.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.191.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.191.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.192.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.192.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.192.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.193.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.193.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.193.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.194.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.194.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.194.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.195.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.195.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.195.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.196.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.196.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.196.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.197.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.197.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.197.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.198.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.198.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.198.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.199.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.199.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.199.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.2.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.2.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.2.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.20.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.20.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.20.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.200.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.200.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.200.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.201.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.201.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.201.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.202.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.202.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.202.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.203.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.203.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.203.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.204.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.204.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.204.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.205.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.205.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.205.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.206.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.206.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.206.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.207.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.207.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.207.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.208.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.208.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.208.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.209.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.209.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.209.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.21.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.21.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.21.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.210.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.210.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.210.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.211.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.211.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.211.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.212.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.212.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.212.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.213.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.213.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.213.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.214.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.214.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.214.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.215.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.215.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.215.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.216.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.216.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.216.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.217.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.217.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.217.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.218.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.218.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.218.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.219.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.219.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.219.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.22.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.22.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.22.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.220.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.220.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.220.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.221.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.221.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.221.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.222.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.222.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.222.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.223.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.223.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.223.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.224.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.224.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.224.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.225.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.225.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.225.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.226.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.226.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.226.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.227.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.227.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.227.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.228.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.228.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.228.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.229.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.229.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.229.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.23.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.23.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.23.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.230.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.230.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.230.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.231.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.231.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.231.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.232.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.232.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.232.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.233.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.233.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.233.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.234.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.234.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.234.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.235.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.235.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.235.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.236.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.236.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.236.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.237.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.237.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.237.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.238.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.238.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.238.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.239.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.239.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.239.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.24.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.24.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.24.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.240.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.240.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.240.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.241.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.241.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.241.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.242.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.242.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.242.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.243.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.243.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.243.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.244.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.244.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.244.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.245.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.245.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.245.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.246.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.246.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.246.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.247.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.247.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.247.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.248.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.248.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.248.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.249.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.249.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.249.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.25.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.25.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.25.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.250.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.250.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.250.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.251.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.251.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.251.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.252.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.252.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.252.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.253.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.253.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.253.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.254.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.254.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.254.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.255.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.255.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.255.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.26.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.26.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.26.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.27.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.27.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.27.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.28.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.28.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.28.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.29.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.29.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.29.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.3.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.3.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.3.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.30.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.30.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.30.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.31.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.31.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.31.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.32.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.32.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.32.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.33.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.33.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.33.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.34.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.34.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.34.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.35.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.35.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.35.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.36.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.36.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.36.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.37.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.37.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.37.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.38.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.38.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.38.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.39.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.39.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.39.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.4.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.4.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.4.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.40.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.40.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.40.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.41.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.41.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.41.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.42.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.42.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.42.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.43.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.43.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.43.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.44.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.44.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.44.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.45.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.45.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.45.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.46.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.46.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.46.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.47.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.47.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.47.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.48.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.48.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.48.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.49.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.49.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.49.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.5.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.5.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.5.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.50.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.50.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.50.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.51.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.51.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.51.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.52.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.52.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.52.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.53.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.53.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.53.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.54.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.54.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.54.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.55.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.55.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.55.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.56.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.56.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.56.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.57.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.57.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.57.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.58.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.58.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.58.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.59.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.59.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.59.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.6.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.6.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.6.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.60.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.60.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.60.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.61.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.61.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.61.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.62.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.62.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.62.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.63.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.63.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.63.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.64.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.64.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.64.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.65.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.65.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.65.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.66.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.66.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.66.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.67.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.67.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.67.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.68.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.68.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.68.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.69.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.69.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.69.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.7.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.7.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.7.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.70.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.70.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.70.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.71.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.71.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.71.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.72.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.72.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.72.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.73.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.73.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.73.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.74.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.74.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.74.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.75.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.75.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.75.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.76.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.76.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.76.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.77.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.77.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.77.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.78.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.78.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.78.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.79.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.79.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.79.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.8.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.8.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.8.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.80.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.80.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.80.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.81.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.81.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.81.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.82.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.82.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.82.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.83.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.83.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.83.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.84.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.84.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.84.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.85.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.85.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.85.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.86.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.86.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.86.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.87.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.87.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.87.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.88.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.88.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.88.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.89.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.89.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.89.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.9.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.9.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.9.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.90.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.90.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.90.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.91.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.91.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.91.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.92.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.92.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.92.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.93.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.93.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.93.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.94.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.94.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.94.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.95.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.95.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.95.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.96.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.96.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.96.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.97.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.97.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.97.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.98.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.98.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.98.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.99.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.99.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.down_proj_list.99.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.0.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.0.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.1.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.1.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.10.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.10.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.100.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.100.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.101.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.101.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.102.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.102.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.103.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.103.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.104.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.104.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.105.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.105.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.106.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.106.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.107.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.107.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.108.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.108.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.109.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.109.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.11.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.11.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.110.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.110.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.111.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.111.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.112.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.112.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.113.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.113.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.114.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.114.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.115.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.115.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.116.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.116.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.117.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.117.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.118.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.118.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.119.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.119.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.12.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.12.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.120.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.120.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.121.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.121.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.122.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.122.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.123.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.123.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.124.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.124.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.125.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.125.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.126.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.126.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.127.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.127.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.128.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.128.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.129.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.129.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.13.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.13.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.130.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.130.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.131.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.131.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.132.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.132.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.133.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.133.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.134.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.134.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.135.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.135.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.136.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.136.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.137.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.137.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.138.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.138.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.139.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.139.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.14.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.14.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.140.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.140.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.141.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.141.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.142.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.142.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.143.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.143.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.144.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.144.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.145.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.145.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.146.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.146.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.147.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.147.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.148.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.148.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.149.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.149.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.15.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.15.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.150.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.150.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.151.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.151.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.152.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.152.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.153.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.153.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.154.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.154.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.155.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.155.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.156.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.156.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.157.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.157.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.158.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.158.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.159.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.159.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.16.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.16.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.160.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.160.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.161.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.161.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.162.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.162.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.163.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.163.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.164.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.164.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.165.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.165.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.166.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.166.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.167.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.167.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.168.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.168.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.169.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.169.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.17.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.17.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.170.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.170.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.171.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.171.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.172.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.172.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.173.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.173.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.174.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.174.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.175.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.175.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.176.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.176.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.177.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.177.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.178.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.178.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.179.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.179.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.18.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.18.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.180.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.180.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.181.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.181.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.182.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.182.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.183.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.183.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.184.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.184.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.185.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.185.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.186.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.186.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.187.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.187.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.188.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.188.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.189.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.189.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.19.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.19.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.190.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.190.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.191.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.191.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.192.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.192.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.193.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.193.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.194.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.194.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.195.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.195.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.196.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.196.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.197.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.197.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.198.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.198.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.199.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.199.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.2.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.2.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.20.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.20.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.200.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.200.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.201.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.201.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.202.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.202.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.203.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.203.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.204.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.204.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.205.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.205.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.206.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.206.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.207.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.207.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.208.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.208.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.209.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.209.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.21.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.21.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.210.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.210.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.211.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.211.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.212.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.212.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.213.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.213.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.214.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.214.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.215.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.215.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.216.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.216.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.217.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.217.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.218.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.218.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.219.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.219.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.22.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.22.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.220.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.220.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.221.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.221.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.222.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.222.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.223.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.223.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.224.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.224.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.225.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.225.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.226.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.226.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.227.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.227.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.228.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.228.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.229.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.229.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.23.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.23.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.230.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.230.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.231.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.231.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.232.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.232.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.233.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.233.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.234.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.234.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.235.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.235.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.236.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.236.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.237.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.237.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.238.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.238.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.239.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.239.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.24.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.24.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.240.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.240.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.241.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.241.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.242.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.242.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.243.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.243.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.244.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.244.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.245.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.245.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.246.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.246.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.247.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.247.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.248.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.248.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.249.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.249.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.25.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.25.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.250.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.250.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.251.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.251.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.252.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.252.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.253.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.253.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.254.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.254.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.255.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.255.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.26.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.26.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.27.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.27.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.28.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.28.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.29.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.29.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.3.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.3.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.30.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.30.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.31.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.31.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.32.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.32.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.33.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.33.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.34.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.34.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.35.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.35.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.36.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.36.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.37.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.37.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.38.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.38.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.39.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.39.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.4.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.4.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.40.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.40.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.41.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.41.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.42.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.42.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.43.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.43.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.44.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.44.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.45.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.45.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.46.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.46.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.47.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.47.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.48.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.48.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.49.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.49.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.5.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.5.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.50.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.50.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.51.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.51.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.52.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.52.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.53.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.53.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.54.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.54.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.55.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.55.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.56.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.56.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.57.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.57.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.58.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.58.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.59.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.59.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.6.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.6.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.60.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.60.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.61.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.61.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.62.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.62.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.63.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.63.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.64.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.64.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.65.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.65.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.66.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.66.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.67.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.67.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.68.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.68.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.69.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.69.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.7.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.7.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.70.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.70.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.71.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.71.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.72.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.72.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.73.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.73.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.74.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.74.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.75.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.75.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.76.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.76.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.77.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.77.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.78.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.78.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.79.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.79.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.8.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.8.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.80.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.80.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.81.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.81.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.82.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.82.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.83.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.83.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.84.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.84.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.85.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.85.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.86.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.86.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.87.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.87.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.88.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.88.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.89.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.89.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.9.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.9.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.90.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.90.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.91.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.91.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.92.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.92.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.93.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.93.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.94.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.94.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.95.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.95.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.96.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.96.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.97.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.97.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.98.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.98.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.99.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.experts.gate_up_proj_list.99.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.gate.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.down_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.down_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.down_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.gate_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.gate_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.gate_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.up_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.up_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert.up_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert_gate.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert_gate.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.37.mlp.shared_expert_gate.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.37.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.38.input_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.A_log": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.conv1d.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.dt_bias": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_a.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_a.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_a.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_b.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_b.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_b.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_qkv.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_qkv.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_qkv.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_z.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_z.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.in_proj_z.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.norm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.out_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.out_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.linear_attn.out_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.0.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.0.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.0.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.1.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.1.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.1.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.10.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.10.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.10.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.100.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.100.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.100.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.101.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.101.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.101.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.102.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.102.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.102.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.103.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.103.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.103.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.104.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.104.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.104.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.105.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.105.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.105.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.106.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.106.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.106.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.107.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.107.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.107.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.108.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.108.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.108.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.109.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.109.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.109.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.11.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.11.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.11.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.110.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.110.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.110.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.111.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.111.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.111.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.112.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.112.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.112.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.113.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.113.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.113.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.114.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.114.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.114.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.115.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.115.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.115.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.116.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.116.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.116.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.117.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.117.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.117.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.118.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.118.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.118.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.119.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.119.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.119.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.12.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.12.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.12.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.120.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.120.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.120.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.121.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.121.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.121.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.122.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.122.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.122.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.123.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.123.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.123.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.124.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.124.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.124.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.125.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.125.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.125.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.126.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.126.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.126.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.127.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.127.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.127.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.128.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.128.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.128.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.129.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.129.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.129.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.13.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.13.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.13.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.130.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.130.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.130.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.131.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.131.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.131.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.132.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.132.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.132.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.133.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.133.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.133.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.134.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.134.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.134.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.135.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.135.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.135.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.136.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.136.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.136.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.137.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.137.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.137.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.138.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.138.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.138.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.139.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.139.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.139.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.14.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.14.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.14.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.140.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.140.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.140.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.141.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.141.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.141.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.142.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.142.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.142.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.143.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.143.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.143.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.144.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.144.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.144.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.145.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.145.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.145.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.146.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.146.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.146.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.147.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.147.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.147.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.148.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.148.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.148.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.149.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.149.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.149.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.15.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.15.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.15.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.150.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.150.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.150.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.151.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.151.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.151.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.152.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.152.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.152.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.153.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.153.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.153.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.154.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.154.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.154.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.155.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.155.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.155.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.156.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.156.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.156.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.157.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.157.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.157.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.158.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.158.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.158.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.159.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.159.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.159.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.16.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.16.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.16.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.160.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.160.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.160.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.161.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.161.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.161.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.162.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.162.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.162.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.163.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.163.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.163.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.164.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.164.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.164.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.165.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.165.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.165.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.166.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.166.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.166.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.167.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.167.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.167.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.168.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.168.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.168.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.169.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.169.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.169.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.17.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.17.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.17.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.170.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.170.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.170.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.171.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.171.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.171.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.172.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.172.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.172.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.173.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.173.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.173.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.174.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.174.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.174.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.175.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.175.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.175.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.176.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.176.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.176.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.177.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.177.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.177.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.178.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.178.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.178.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.179.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.179.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.179.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.18.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.18.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.18.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.180.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.180.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.180.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.181.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.181.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.181.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.182.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.182.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.182.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.183.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.183.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.183.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.184.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.184.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.184.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.185.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.185.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.185.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.186.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.186.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.186.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.187.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.187.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.187.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.188.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.188.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.188.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.189.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.189.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.189.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.19.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.19.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.19.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.190.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.190.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.190.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.191.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.191.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.191.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.192.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.192.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.192.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.193.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.193.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.193.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.194.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.194.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.194.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.195.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.195.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.195.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.196.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.196.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.196.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.197.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.197.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.197.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.198.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.198.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.198.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.199.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.199.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.199.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.2.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.2.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.2.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.20.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.20.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.20.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.200.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.200.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.200.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.201.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.201.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.201.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.202.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.202.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.202.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.203.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.203.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.203.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.204.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.204.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.204.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.205.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.205.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.205.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.206.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.206.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.206.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.207.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.207.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.207.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.208.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.208.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.208.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.209.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.209.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.209.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.21.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.21.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.21.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.210.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.210.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.210.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.211.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.211.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.211.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.212.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.212.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.212.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.213.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.213.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.213.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.214.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.214.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.214.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.215.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.215.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.215.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.216.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.216.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.216.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.217.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.217.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.217.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.218.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.218.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.218.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.219.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.219.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.219.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.22.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.22.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.22.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.220.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.220.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.220.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.221.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.221.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.221.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.222.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.222.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.222.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.223.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.223.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.223.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.224.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.224.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.224.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.225.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.225.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.225.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.226.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.226.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.226.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.227.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.227.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.227.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.228.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.228.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.228.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.229.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.229.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.229.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.23.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.23.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.23.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.230.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.230.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.230.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.231.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.231.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.231.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.232.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.232.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.232.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.233.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.233.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.233.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.234.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.234.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.234.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.235.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.235.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.235.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.236.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.236.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.236.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.237.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.237.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.237.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.238.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.238.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.238.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.239.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.239.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.239.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.24.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.24.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.24.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.240.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.240.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.240.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.241.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.241.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.241.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.242.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.242.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.242.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.243.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.243.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.243.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.244.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.244.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.244.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.245.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.245.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.245.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.246.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.246.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.246.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.247.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.247.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.247.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.248.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.248.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.248.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.249.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.249.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.249.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.25.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.25.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.25.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.250.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.250.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.250.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.251.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.251.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.251.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.252.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.252.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.252.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.253.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.253.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.253.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.254.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.254.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.254.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.255.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.255.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.255.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.26.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.26.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.26.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.27.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.27.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.27.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.28.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.28.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.28.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.29.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.29.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.29.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.3.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.3.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.3.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.30.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.30.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.30.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.31.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.31.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.31.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.32.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.32.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.32.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.33.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.33.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.33.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.34.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.34.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.34.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.35.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.35.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.35.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.36.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.36.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.36.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.37.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.37.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.37.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.38.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.38.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.38.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.39.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.39.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.39.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.4.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.4.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.4.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.40.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.40.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.40.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.41.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.41.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.41.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.42.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.42.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.42.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.43.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.43.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.43.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.44.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.44.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.44.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.45.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.45.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.45.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.46.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.46.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.46.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.47.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.47.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.47.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.48.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.48.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.48.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.49.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.49.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.49.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.5.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.5.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.5.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.50.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.50.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.50.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.51.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.51.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.51.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.52.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.52.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.52.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.53.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.53.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.53.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.54.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.54.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.54.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.55.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.55.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.55.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.56.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.56.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.56.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.57.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.57.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.57.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.58.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.58.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.58.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.59.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.59.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.59.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.6.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.6.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.6.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.60.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.60.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.60.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.61.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.61.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.61.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.62.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.62.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.62.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.63.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.63.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.63.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.64.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.64.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.64.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.65.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.65.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.65.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.66.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.66.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.66.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.67.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.67.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.67.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.68.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.68.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.68.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.69.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.69.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.69.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.7.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.7.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.7.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.70.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.70.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.70.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.71.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.71.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.71.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.72.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.72.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.72.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.73.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.73.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.73.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.74.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.74.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.74.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.75.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.75.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.75.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.76.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.76.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.76.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.77.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.77.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.77.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.78.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.78.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.78.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.79.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.79.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.79.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.8.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.8.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.8.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.80.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.80.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.80.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.81.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.81.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.81.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.82.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.82.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.82.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.83.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.83.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.83.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.84.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.84.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.84.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.85.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.85.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.85.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.86.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.86.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.86.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.87.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.87.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.87.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.88.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.88.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.88.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.89.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.89.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.89.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.9.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.9.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.9.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.90.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.90.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.90.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.91.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.91.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.91.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.92.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.92.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.92.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.93.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.93.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.93.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.94.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.94.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.94.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.95.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.95.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.95.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.96.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.96.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.96.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.97.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.97.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.97.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.98.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.98.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.98.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.99.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.99.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.down_proj_list.99.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.0.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.0.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.1.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.1.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.10.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.10.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.100.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.100.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.101.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.101.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.102.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.102.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.103.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.103.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.104.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.104.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.105.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.105.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.106.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.106.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.107.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.107.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.108.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.108.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.109.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.109.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.11.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.11.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.110.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.110.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.111.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.111.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.112.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.112.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.113.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.113.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.114.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.114.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.115.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.115.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.116.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.116.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.117.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.117.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.118.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.118.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.119.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.119.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.12.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.12.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.120.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.120.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.121.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.121.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.122.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.122.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.123.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.123.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.124.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.124.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.125.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.125.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.126.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.126.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.127.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.127.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.128.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.128.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.129.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.129.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.13.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.13.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.130.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.130.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.131.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.131.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.132.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.132.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.133.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.133.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.134.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.134.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.135.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.135.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.136.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.136.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.137.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.137.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.138.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.138.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.139.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.139.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.14.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.14.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.140.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.140.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.141.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.141.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.142.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.142.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.143.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.143.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.144.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.144.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.145.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.145.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.146.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.146.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.147.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.147.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.148.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.148.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.149.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.149.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.15.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.15.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.150.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.150.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.151.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.151.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.152.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.152.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.153.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.153.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.154.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.154.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.155.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.155.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.156.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.156.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.157.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.157.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.158.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.158.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.159.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.159.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.16.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.16.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.160.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.160.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.161.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.161.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.162.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.162.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.163.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.163.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.164.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.164.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.165.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.165.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.166.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.166.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.167.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.167.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.168.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.168.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.169.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.169.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.17.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.17.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.170.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.170.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.171.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.171.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.172.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.172.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.173.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.173.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.174.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.174.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.175.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.175.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.176.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.176.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.177.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.177.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.178.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.178.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.179.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.179.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.18.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.18.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.180.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.180.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.181.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.181.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.182.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.182.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.183.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.183.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.184.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.184.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.185.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.185.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.186.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.186.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.187.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.187.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.188.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.188.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.189.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.189.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.19.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.19.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.190.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.190.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.191.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.191.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.192.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.192.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.193.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.193.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.194.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.194.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.195.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.195.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.196.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.196.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.197.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.197.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.198.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.198.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.199.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.199.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.2.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.2.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.20.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.20.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.200.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.200.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.201.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.201.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.202.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.202.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.203.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.203.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.204.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.204.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.205.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.205.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.206.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.206.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.207.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.207.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.208.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.208.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.209.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.209.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.21.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.21.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.210.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.210.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.211.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.211.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.212.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.212.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.213.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.213.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.214.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.214.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.215.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.215.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.216.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.216.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.217.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.217.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.218.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.218.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.219.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.219.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.22.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.22.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.220.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.220.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.221.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.221.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.222.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.222.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.223.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.223.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.224.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.224.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.225.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.225.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.226.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.226.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.227.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.227.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.228.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.228.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.229.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.229.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.23.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.23.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.230.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.230.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.231.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.231.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.232.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.232.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.233.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.233.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.234.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.234.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.235.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.235.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.236.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.236.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.237.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.237.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.238.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.238.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.239.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.239.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.24.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.24.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.240.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.240.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.241.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.241.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.242.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.242.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.243.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.243.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.244.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.244.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.245.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.245.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.246.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.246.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.247.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.247.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.248.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.248.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.249.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.249.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.25.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.25.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.250.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.250.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.251.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.251.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.252.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.252.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.253.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.253.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.254.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.254.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.255.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.255.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.26.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.26.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.27.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.27.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.28.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.28.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.29.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.29.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.3.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.3.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.30.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.30.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.31.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.31.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.32.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.32.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.33.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.33.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.34.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.34.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.35.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.35.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.36.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.36.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.37.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.37.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.38.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.38.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.39.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.39.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.4.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.4.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.40.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.40.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.41.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.41.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.42.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.42.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.43.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.43.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.44.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.44.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.45.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.45.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.46.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.46.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.47.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.47.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.48.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.48.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.49.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.49.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.5.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.5.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.50.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.50.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.51.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.51.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.52.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.52.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.53.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.53.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.54.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.54.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.55.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.55.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.56.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.56.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.57.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.57.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.58.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.58.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.59.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.59.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.6.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.6.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.60.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.60.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.61.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.61.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.62.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.62.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.63.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.63.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.64.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.64.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.65.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.65.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.66.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.66.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.67.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.67.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.68.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.68.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.69.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.69.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.7.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.7.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.70.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.70.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.71.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.71.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.72.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.72.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.73.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.73.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.74.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.74.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.75.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.75.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.76.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.76.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.77.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.77.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.78.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.78.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.79.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.79.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.8.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.8.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.80.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.80.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.81.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.81.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.82.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.82.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.83.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.83.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.84.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.84.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.85.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.85.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.86.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.86.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.87.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.87.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.88.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.88.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.89.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.89.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.9.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.9.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.90.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.90.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.91.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.91.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.92.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.92.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.93.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.93.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.94.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.94.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.95.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.95.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.96.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.96.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.97.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.97.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.98.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.98.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.99.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.experts.gate_up_proj_list.99.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.gate.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.down_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.down_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.down_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.gate_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.gate_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.gate_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.up_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.up_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert.up_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert_gate.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert_gate.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.38.mlp.shared_expert_gate.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.38.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.39.input_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.0.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.0.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.0.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.1.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.1.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.1.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.10.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.10.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.10.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.100.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.100.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.100.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.101.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.101.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.101.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.102.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.102.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.102.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.103.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.103.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.103.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.104.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.104.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.104.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.105.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.105.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.105.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.106.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.106.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.106.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.107.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.107.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.107.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.108.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.108.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.108.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.109.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.109.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.109.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.11.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.11.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.11.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.110.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.110.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.110.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.111.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.111.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.111.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.112.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.112.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.112.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.113.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.113.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.113.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.114.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.114.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.114.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.115.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.115.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.115.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.116.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.116.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.116.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.117.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.117.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.117.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.118.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.118.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.118.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.119.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.119.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.119.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.12.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.12.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.12.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.120.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.120.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.120.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.121.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.121.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.121.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.122.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.122.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.122.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.123.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.123.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.123.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.124.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.124.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.124.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.125.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.125.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.125.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.126.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.126.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.126.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.127.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.127.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.127.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.128.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.128.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.128.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.129.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.129.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.129.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.13.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.13.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.13.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.130.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.130.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.130.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.131.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.131.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.131.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.132.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.132.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.132.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.133.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.133.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.133.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.134.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.134.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.134.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.135.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.135.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.135.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.136.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.136.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.136.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.137.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.137.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.137.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.138.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.138.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.138.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.139.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.139.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.139.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.14.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.14.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.14.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.140.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.140.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.140.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.141.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.141.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.141.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.142.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.142.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.142.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.143.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.143.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.143.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.144.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.144.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.144.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.145.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.145.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.145.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.146.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.146.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.146.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.147.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.147.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.147.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.148.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.148.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.148.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.149.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.149.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.149.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.15.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.15.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.15.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.150.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.150.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.150.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.151.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.151.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.151.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.152.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.152.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.152.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.153.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.153.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.153.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.154.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.154.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.154.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.155.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.155.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.155.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.156.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.156.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.156.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.157.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.157.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.157.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.158.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.158.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.158.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.159.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.159.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.159.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.16.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.16.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.16.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.160.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.160.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.160.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.161.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.161.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.161.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.162.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.162.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.162.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.163.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.163.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.163.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.164.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.164.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.164.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.165.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.165.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.165.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.166.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.166.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.166.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.167.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.167.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.167.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.168.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.168.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.168.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.169.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.169.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.169.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.17.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.17.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.17.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.170.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.170.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.170.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.171.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.171.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.171.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.172.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.172.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.172.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.173.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.173.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.173.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.174.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.174.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.174.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.175.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.175.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.175.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.176.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.176.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.176.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.177.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.177.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.177.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.178.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.178.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.178.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.179.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.179.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.179.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.18.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.18.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.18.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.180.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.180.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.180.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.181.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.181.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.181.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.182.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.182.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.182.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.183.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.183.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.183.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.184.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.184.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.184.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.185.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.185.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.185.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.186.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.186.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.186.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.187.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.187.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.187.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.188.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.188.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.188.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.189.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.189.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.189.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.19.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.19.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.19.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.190.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.190.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.190.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.191.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.191.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.191.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.192.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.192.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.192.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.193.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.193.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.193.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.194.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.194.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.194.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.195.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.195.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.195.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.196.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.196.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.196.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.197.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.197.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.197.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.198.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.198.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.198.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.199.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.199.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.199.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.2.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.2.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.2.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.20.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.20.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.20.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.200.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.200.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.200.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.201.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.201.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.201.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.202.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.202.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.202.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.203.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.203.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.203.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.204.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.204.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.204.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.205.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.205.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.205.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.206.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.206.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.206.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.207.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.207.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.207.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.208.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.208.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.208.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.209.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.209.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.209.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.21.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.21.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.21.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.210.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.210.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.210.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.211.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.211.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.211.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.212.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.212.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.212.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.213.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.213.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.213.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.214.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.214.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.214.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.215.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.215.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.215.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.216.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.216.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.216.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.217.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.217.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.217.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.218.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.218.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.218.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.219.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.219.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.219.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.22.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.22.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.22.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.220.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.220.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.220.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.221.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.221.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.221.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.222.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.222.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.222.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.223.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.223.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.223.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.224.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.224.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.224.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.225.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.225.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.225.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.226.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.226.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.226.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.227.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.227.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.227.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.228.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.228.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.228.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.229.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.229.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.229.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.23.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.23.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.23.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.230.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.230.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.230.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.231.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.231.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.231.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.232.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.232.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.232.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.233.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.233.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.233.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.234.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.234.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.234.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.235.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.235.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.235.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.236.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.236.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.236.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.237.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.237.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.237.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.238.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.238.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.238.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.239.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.239.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.239.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.24.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.24.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.24.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.240.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.240.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.240.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.241.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.241.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.241.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.242.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.242.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.242.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.243.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.243.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.243.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.244.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.244.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.244.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.245.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.245.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.245.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.246.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.246.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.246.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.247.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.247.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.247.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.248.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.248.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.248.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.249.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.249.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.249.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.25.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.25.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.25.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.250.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.250.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.250.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.251.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.251.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.251.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.252.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.252.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.252.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.253.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.253.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.253.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.254.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.254.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.254.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.255.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.255.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.255.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.26.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.26.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.26.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.27.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.27.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.27.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.28.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.28.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.28.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.29.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.29.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.29.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.3.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.3.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.3.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.30.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.30.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.30.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.31.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.31.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.31.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.32.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.32.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.32.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.33.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.33.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.33.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.34.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.34.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.34.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.35.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.35.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.35.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.36.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.36.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.36.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.37.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.37.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.37.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.38.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.38.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.38.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.39.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.39.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.39.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.4.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.4.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.4.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.40.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.40.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.40.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.41.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.41.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.41.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.42.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.42.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.42.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.43.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.43.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.43.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.44.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.44.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.44.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.45.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.45.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.45.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.46.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.46.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.46.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.47.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.47.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.47.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.48.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.48.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.48.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.49.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.49.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.49.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.5.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.5.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.5.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.50.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.50.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.50.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.51.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.51.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.51.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.52.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.52.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.52.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.53.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.53.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.53.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.54.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.54.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.54.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.55.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.55.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.55.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.56.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.56.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.56.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.57.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.57.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.57.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.58.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.58.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.58.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.59.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.59.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.59.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.6.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.6.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.6.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.60.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.60.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.60.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.61.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.61.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.61.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.62.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.62.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.62.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.63.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.63.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.63.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.64.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.64.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.64.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.65.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.65.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.65.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.66.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.66.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.66.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.67.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.67.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.67.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.68.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.68.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.68.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.69.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.69.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.69.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.7.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.7.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.7.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.70.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.70.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.70.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.71.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.71.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.71.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.72.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.72.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.72.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.73.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.73.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.73.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.74.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.74.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.74.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.75.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.75.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.75.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.76.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.76.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.76.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.77.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.77.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.77.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.78.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.78.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.78.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.79.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.79.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.79.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.8.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.8.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.8.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.80.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.80.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.80.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.81.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.81.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.81.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.82.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.82.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.82.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.83.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.83.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.83.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.84.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.84.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.84.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.85.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.85.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.85.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.86.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.86.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.86.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.87.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.87.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.87.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.88.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.88.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.88.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.89.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.89.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.89.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.9.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.9.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.9.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.90.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.90.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.90.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.91.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.91.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.91.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.92.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.92.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.92.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.93.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.93.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.93.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.94.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.94.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.94.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.95.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.95.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.95.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.96.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.96.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.96.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.97.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.97.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.97.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.98.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.98.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.98.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.99.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.99.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.down_proj_list.99.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.0.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.0.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.1.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.1.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.10.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.10.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.100.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.100.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.101.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.101.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.102.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.102.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.103.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.103.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.104.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.104.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.105.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.105.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.106.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.106.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.107.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.107.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.108.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.108.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.109.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.109.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.11.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.11.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.110.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.110.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.111.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.111.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.112.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.112.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.113.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.113.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.114.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.114.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.115.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.115.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.116.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.116.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.117.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.117.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.118.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.118.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.119.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.119.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.12.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.12.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.120.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.120.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.121.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.121.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.122.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.122.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.123.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.123.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.124.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.124.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.125.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.125.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.126.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.126.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.127.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.127.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.128.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.128.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.129.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.129.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.13.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.13.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.130.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.130.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.131.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.131.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.132.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.132.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.133.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.133.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.134.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.134.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.135.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.135.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.136.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.136.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.137.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.137.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.138.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.138.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.139.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.139.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.14.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.14.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.140.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.140.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.141.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.141.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.142.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.142.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.143.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.143.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.144.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.144.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.145.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.145.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.146.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.146.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.147.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.147.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.148.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.148.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.149.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.149.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.15.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.15.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.150.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.150.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.151.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.151.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.152.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.152.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.153.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.153.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.154.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.154.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.155.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.155.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.156.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.156.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.157.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.157.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.158.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.158.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.159.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.159.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.16.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.16.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.160.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.160.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.161.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.161.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.162.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.162.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.163.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.163.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.164.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.164.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.165.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.165.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.166.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.166.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.167.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.167.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.168.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.168.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.169.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.169.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.17.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.17.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.170.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.170.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.171.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.171.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.172.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.172.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.173.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.173.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.174.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.174.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.175.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.175.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.176.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.176.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.177.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.177.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.178.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.178.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.179.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.179.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.18.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.18.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.180.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.180.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.181.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.181.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.182.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.182.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.183.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.183.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.184.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.184.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.185.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.185.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.186.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.186.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.187.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.187.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.188.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.188.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.189.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.189.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.19.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.19.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.190.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.190.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.191.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.191.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.192.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.192.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.193.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.193.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.194.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.194.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.195.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.195.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.196.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.196.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.197.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.197.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.198.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.198.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.199.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.199.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.2.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.2.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.20.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.20.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.200.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.200.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.201.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.201.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.202.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.202.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.203.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.203.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.204.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.204.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.205.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.205.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.206.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.206.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.207.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.207.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.208.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.208.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.209.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.209.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.21.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.21.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.210.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.210.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.211.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.211.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.212.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.212.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.213.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.213.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.214.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.214.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.215.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.215.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.216.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.216.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.217.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.217.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.218.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.218.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.219.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.219.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.22.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.22.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.220.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.220.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.221.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.221.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.222.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.222.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.223.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.223.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.224.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.224.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.225.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.225.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.226.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.226.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.227.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.227.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.228.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.228.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.229.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.229.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.23.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.23.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.230.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.230.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.231.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.231.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.232.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.232.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.233.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.233.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.234.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.234.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.235.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.235.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.236.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.236.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.237.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.237.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.238.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.238.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.239.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.239.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.24.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.24.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.240.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.240.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.241.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.241.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.242.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.242.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.243.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.243.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.244.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.244.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.245.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.245.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.246.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.246.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.247.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.247.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.248.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.248.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.249.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.249.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.25.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.25.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.250.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.250.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.251.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.251.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.252.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.252.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.253.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.253.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.254.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.254.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.255.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.255.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.26.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.26.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.27.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.27.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.28.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.28.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.29.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.29.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.3.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.3.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.30.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.30.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.31.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.31.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.32.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.32.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.33.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.33.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.34.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.34.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.35.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.35.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.36.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.36.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.37.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.37.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.38.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.38.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.39.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.39.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.4.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.4.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.40.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.40.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.41.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.41.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.42.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.42.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.43.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.43.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.44.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.44.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.45.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.45.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.46.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.46.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.47.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.47.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.48.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.48.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.49.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.49.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.5.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.5.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.50.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.50.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.51.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.51.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.52.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.52.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.53.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.53.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.54.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.54.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.55.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.55.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.56.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.56.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.57.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.57.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.58.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.58.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.59.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.59.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.6.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.6.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.60.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.60.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.61.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.61.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.62.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.62.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.63.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.63.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.64.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.64.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.65.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.65.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.66.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.66.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.67.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.67.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.68.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.68.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.69.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.69.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.7.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.7.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.70.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.70.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.71.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.71.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.72.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.72.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.73.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.73.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.74.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.74.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.75.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.75.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.76.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.76.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.77.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.77.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.78.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.78.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.79.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.79.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.8.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.8.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.80.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.80.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.81.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.81.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.82.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.82.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.83.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.83.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.84.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.84.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.85.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.85.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.86.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.86.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.87.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.87.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.88.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.88.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.89.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.89.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.9.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.9.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.90.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.90.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.91.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.91.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.92.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.92.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.93.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.93.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.94.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.94.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.95.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.95.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.96.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.96.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.97.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.97.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.98.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.98.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.99.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.experts.gate_up_proj_list.99.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.gate.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.down_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.down_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.down_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.gate_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.gate_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.gate_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.up_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.up_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert.up_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert_gate.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert_gate.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.mlp.shared_expert_gate.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.post_attention_layernorm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.k_norm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.k_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.k_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.k_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.o_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.o_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.o_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.q_norm.weight": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.q_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.q_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.q_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.v_proj.W_q_packed": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.v_proj.scale": "model-00004-of-00004.safetensors", "model.language_model.layers.39.self_attn.v_proj.zero": "model-00004-of-00004.safetensors", "model.language_model.layers.4.input_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.A_log": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.conv1d.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.dt_bias": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_a.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_a.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_a.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_b.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_b.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_b.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_qkv.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_qkv.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_qkv.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_z.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_z.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.in_proj_z.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.out_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.out_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.linear_attn.out_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.down_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.down_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.down_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.down_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.gate_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.gate_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.gate_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.up_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.up_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert.up_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert_gate.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert_gate.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.4.mlp.shared_expert_gate.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.4.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.5.input_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.A_log": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.conv1d.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.dt_bias": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_a.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_a.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_a.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_b.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_b.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_b.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_qkv.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_qkv.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_qkv.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_z.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_z.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.in_proj_z.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.out_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.out_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.linear_attn.out_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.down_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.down_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.down_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.down_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.gate_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.gate_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.gate_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.up_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.up_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert.up_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert_gate.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert_gate.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.5.mlp.shared_expert_gate.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.5.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.6.input_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.A_log": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.conv1d.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.dt_bias": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_a.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_a.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_a.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_b.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_b.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_b.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_qkv.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_qkv.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_qkv.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_z.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_z.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.in_proj_z.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.out_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.out_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.linear_attn.out_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.down_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.down_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.down_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.down_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.gate_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.gate_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.gate_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.up_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.up_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert.up_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert_gate.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert_gate.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.6.mlp.shared_expert_gate.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.6.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.7.input_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.down_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.182.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.182.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.183.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.183.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.184.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.184.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.185.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.185.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.186.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.186.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.187.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.187.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.188.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.188.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.189.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.189.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.190.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.190.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.191.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.191.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.192.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.192.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.193.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.193.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.194.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.194.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.195.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.195.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.196.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.196.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.197.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.197.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.198.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.198.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.199.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.199.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.200.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.200.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.201.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.201.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.202.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.202.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.203.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.203.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.204.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.204.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.205.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.205.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.206.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.206.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.207.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.207.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.208.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.208.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.209.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.209.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.210.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.210.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.211.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.211.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.212.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.212.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.213.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.213.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.214.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.214.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.215.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.215.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.216.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.216.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.217.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.217.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.218.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.218.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.219.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.219.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.220.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.220.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.221.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.221.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.222.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.222.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.223.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.223.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.224.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.224.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.225.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.225.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.226.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.226.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.227.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.227.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.228.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.228.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.229.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.229.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.230.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.230.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.231.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.231.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.232.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.232.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.233.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.233.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.234.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.234.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.235.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.235.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.236.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.236.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.237.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.237.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.238.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.238.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.239.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.239.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.240.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.240.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.241.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.241.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.242.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.242.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.243.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.243.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.244.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.244.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.245.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.245.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.246.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.246.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.247.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.247.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.248.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.248.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.249.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.249.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.250.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.250.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.251.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.251.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.252.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.252.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.253.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.253.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.254.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.254.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.255.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.255.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.down_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.down_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.down_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.gate_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.gate_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.gate_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.up_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.up_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert.up_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert_gate.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert_gate.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.mlp.shared_expert_gate.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.post_attention_layernorm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.k_norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.k_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.k_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.k_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.o_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.o_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.o_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.q_norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.q_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.q_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.q_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.v_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.v_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.7.self_attn.v_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.8.linear_attn.A_log": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.conv1d.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.dt_bias": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_a.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_a.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_a.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_b.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_b.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_b.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_qkv.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_qkv.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_qkv.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_z.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_z.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.in_proj_z.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.norm.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.out_proj.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.out_proj.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.linear_attn.out_proj.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.0.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.0.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.1.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.1.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.10.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.10.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.100.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.100.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.101.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.101.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.102.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.102.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.103.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.103.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.104.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.104.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.105.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.105.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.106.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.106.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.107.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.107.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.108.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.108.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.109.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.109.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.11.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.11.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.110.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.110.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.111.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.111.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.112.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.112.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.113.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.113.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.114.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.114.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.115.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.115.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.116.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.116.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.117.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.117.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.118.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.118.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.119.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.119.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.12.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.12.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.120.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.120.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.121.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.121.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.122.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.122.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.123.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.123.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.124.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.124.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.125.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.125.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.126.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.126.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.127.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.127.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.128.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.128.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.129.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.129.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.13.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.13.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.130.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.130.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.131.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.131.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.132.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.132.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.133.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.133.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.134.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.134.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.135.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.135.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.136.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.136.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.137.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.137.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.138.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.138.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.139.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.139.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.14.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.14.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.140.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.140.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.141.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.141.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.142.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.142.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.143.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.143.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.144.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.144.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.145.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.145.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.146.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.146.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.147.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.147.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.148.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.148.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.149.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.149.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.15.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.15.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.150.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.150.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.151.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.151.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.152.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.152.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.153.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.153.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.154.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.154.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.155.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.155.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.156.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.156.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.157.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.157.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.158.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.158.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.159.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.159.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.16.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.16.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.160.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.160.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.161.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.161.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.162.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.162.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.163.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.163.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.164.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.164.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.165.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.165.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.166.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.166.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.167.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.167.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.168.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.168.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.169.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.169.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.17.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.17.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.170.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.170.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.171.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.171.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.172.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.172.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.173.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.173.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.174.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.174.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.175.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.175.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.176.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.176.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.177.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.177.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.178.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.178.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.179.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.179.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.18.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.18.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.180.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.180.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.181.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.181.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.19.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.19.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.2.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.2.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.20.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.20.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.21.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.21.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.22.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.22.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.23.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.23.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.24.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.24.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.25.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.25.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.26.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.26.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.27.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.27.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.28.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.28.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.29.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.29.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.3.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.3.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.30.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.30.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.31.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.31.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.32.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.32.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.33.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.33.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.34.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.34.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.35.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.35.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.36.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.36.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.37.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.37.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.38.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.38.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.39.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.39.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.4.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.4.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.40.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.40.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.41.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.41.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.42.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.42.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.43.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.43.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.44.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.44.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.45.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.45.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.46.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.46.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.47.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.47.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.48.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.48.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.49.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.49.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.5.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.5.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.50.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.50.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.51.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.51.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.52.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.52.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.53.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.53.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.54.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.54.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.55.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.55.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.56.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.56.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.57.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.57.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.58.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.58.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.59.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.59.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.6.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.6.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.60.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.60.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.61.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.61.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.62.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.62.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.63.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.63.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.64.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.64.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.65.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.65.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.66.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.66.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.67.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.67.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.68.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.68.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.69.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.69.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.7.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.7.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.70.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.70.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.71.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.71.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.72.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.72.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.73.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.73.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.74.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.74.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.75.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.75.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.76.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.76.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.77.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.77.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.78.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.78.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.79.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.79.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.8.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.8.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.80.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.80.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.81.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.81.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.82.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.82.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.83.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.83.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.84.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.84.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.85.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.85.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.86.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.86.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.87.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.87.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.88.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.88.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.89.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.89.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.9.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.9.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.90.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.90.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.91.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.91.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.92.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.92.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.93.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.93.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.94.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.94.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.95.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.95.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.96.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.96.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.97.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.97.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.98.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.98.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.99.scale": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.experts.gate_up_proj_list.99.zero": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.gate.weight": "model-00001-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.8.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.8.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.9.input_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.A_log": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.conv1d.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.dt_bias": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_a.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_a.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_a.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_b.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_b.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_b.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_qkv.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_qkv.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_qkv.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_z.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_z.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.in_proj_z.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.norm.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.out_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.out_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.linear_attn.out_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.down_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.0.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.0.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.0.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.1.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.1.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.1.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.10.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.10.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.10.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.100.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.100.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.100.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.101.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.101.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.101.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.102.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.102.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.102.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.103.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.103.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.103.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.104.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.104.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.104.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.105.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.105.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.105.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.106.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.106.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.106.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.107.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.107.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.107.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.108.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.108.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.108.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.109.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.109.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.109.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.11.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.11.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.11.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.110.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.110.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.110.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.111.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.111.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.111.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.112.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.112.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.112.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.113.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.113.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.113.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.114.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.114.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.114.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.115.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.115.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.115.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.116.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.116.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.116.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.117.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.117.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.117.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.118.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.118.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.118.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.119.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.119.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.119.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.12.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.12.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.12.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.120.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.120.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.120.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.121.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.121.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.121.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.122.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.122.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.122.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.123.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.123.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.123.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.124.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.124.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.124.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.125.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.125.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.125.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.126.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.126.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.126.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.127.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.127.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.127.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.128.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.128.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.128.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.129.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.129.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.129.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.13.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.13.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.13.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.130.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.130.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.130.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.131.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.131.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.131.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.132.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.132.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.132.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.133.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.133.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.133.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.134.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.134.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.134.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.135.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.135.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.135.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.136.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.136.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.136.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.137.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.137.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.137.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.138.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.138.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.138.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.139.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.139.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.139.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.14.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.14.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.14.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.140.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.140.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.140.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.141.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.141.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.141.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.142.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.142.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.142.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.143.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.143.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.143.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.144.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.144.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.144.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.145.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.145.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.145.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.146.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.146.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.146.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.147.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.147.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.147.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.148.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.148.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.148.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.149.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.149.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.149.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.15.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.15.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.15.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.150.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.150.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.150.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.151.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.151.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.151.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.152.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.152.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.152.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.153.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.153.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.153.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.154.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.154.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.154.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.155.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.155.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.155.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.156.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.156.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.156.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.157.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.157.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.157.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.158.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.158.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.158.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.159.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.159.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.159.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.16.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.16.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.16.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.160.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.160.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.160.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.161.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.161.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.161.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.162.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.162.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.162.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.163.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.163.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.163.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.164.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.164.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.164.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.165.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.165.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.165.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.166.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.166.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.166.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.167.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.167.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.167.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.168.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.168.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.168.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.169.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.169.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.169.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.17.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.17.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.17.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.170.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.170.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.170.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.171.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.171.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.171.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.172.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.172.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.172.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.173.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.173.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.173.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.174.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.174.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.174.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.175.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.175.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.175.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.176.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.176.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.176.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.177.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.177.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.177.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.178.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.178.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.178.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.179.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.179.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.179.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.18.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.18.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.18.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.180.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.180.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.180.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.181.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.181.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.181.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.182.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.182.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.182.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.183.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.183.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.183.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.184.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.184.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.184.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.185.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.185.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.185.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.186.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.186.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.186.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.187.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.187.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.187.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.188.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.188.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.188.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.189.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.189.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.189.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.19.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.19.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.19.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.190.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.190.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.190.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.191.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.191.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.191.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.192.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.192.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.192.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.193.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.193.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.193.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.194.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.194.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.194.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.195.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.195.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.195.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.196.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.196.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.196.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.197.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.197.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.197.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.198.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.198.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.198.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.199.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.199.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.199.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.2.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.2.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.2.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.20.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.20.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.20.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.200.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.200.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.200.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.201.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.201.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.201.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.202.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.202.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.202.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.203.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.203.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.203.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.204.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.204.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.204.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.205.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.205.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.205.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.206.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.206.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.206.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.207.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.207.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.207.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.208.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.208.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.208.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.209.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.209.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.209.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.21.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.21.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.21.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.210.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.210.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.210.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.211.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.211.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.211.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.212.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.212.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.212.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.213.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.213.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.213.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.214.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.214.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.214.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.215.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.215.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.215.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.216.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.216.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.216.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.217.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.217.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.217.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.218.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.218.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.218.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.219.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.219.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.219.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.22.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.22.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.22.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.220.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.220.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.220.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.221.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.221.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.221.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.222.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.222.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.222.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.223.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.223.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.223.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.224.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.224.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.224.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.225.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.225.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.225.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.226.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.226.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.226.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.227.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.227.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.227.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.228.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.228.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.228.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.229.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.229.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.229.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.23.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.23.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.23.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.230.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.230.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.230.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.231.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.231.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.231.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.232.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.232.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.232.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.233.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.233.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.233.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.234.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.234.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.234.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.235.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.235.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.235.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.236.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.236.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.236.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.237.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.237.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.237.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.238.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.238.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.238.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.239.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.239.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.239.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.24.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.24.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.24.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.240.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.240.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.240.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.241.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.241.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.241.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.242.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.242.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.242.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.243.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.243.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.243.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.244.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.244.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.244.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.245.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.245.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.245.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.246.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.246.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.246.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.247.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.247.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.247.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.248.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.248.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.248.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.249.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.249.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.249.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.25.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.25.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.25.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.250.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.250.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.250.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.251.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.251.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.251.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.252.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.252.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.252.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.253.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.253.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.253.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.254.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.254.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.254.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.255.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.255.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.255.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.26.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.26.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.26.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.27.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.27.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.27.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.28.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.28.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.28.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.29.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.29.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.29.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.3.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.3.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.3.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.30.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.30.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.30.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.31.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.31.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.31.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.32.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.32.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.32.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.33.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.33.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.33.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.34.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.34.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.34.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.35.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.35.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.35.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.36.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.36.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.36.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.37.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.37.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.37.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.38.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.38.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.38.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.39.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.39.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.39.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.4.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.4.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.4.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.40.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.40.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.40.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.41.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.41.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.41.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.42.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.42.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.42.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.43.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.43.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.43.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.44.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.44.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.44.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.45.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.45.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.45.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.46.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.46.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.46.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.47.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.47.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.47.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.48.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.48.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.48.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.49.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.49.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.49.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.5.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.5.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.5.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.50.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.50.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.50.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.51.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.51.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.51.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.52.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.52.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.52.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.53.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.53.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.53.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.54.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.54.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.54.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.55.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.55.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.55.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.56.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.56.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.56.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.57.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.57.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.57.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.58.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.58.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.58.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.59.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.59.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.59.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.6.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.6.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.6.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.60.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.60.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.60.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.61.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.61.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.61.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.62.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.62.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.62.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.63.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.63.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.63.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.64.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.64.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.64.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.65.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.65.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.65.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.66.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.66.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.66.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.67.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.67.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.67.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.68.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.68.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.68.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.69.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.69.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.69.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.7.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.7.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.7.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.70.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.70.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.70.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.71.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.71.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.71.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.72.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.72.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.72.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.73.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.73.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.73.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.74.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.74.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.74.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.75.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.75.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.75.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.76.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.76.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.76.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.77.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.77.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.77.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.78.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.78.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.78.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.79.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.79.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.79.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.8.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.8.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.8.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.80.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.80.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.80.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.81.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.81.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.81.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.82.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.82.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.82.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.83.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.83.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.83.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.84.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.84.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.84.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.85.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.85.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.85.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.86.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.86.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.86.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.87.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.87.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.87.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.88.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.88.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.88.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.89.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.89.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.89.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.9.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.9.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.9.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.90.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.90.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.90.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.91.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.91.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.91.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.92.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.92.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.92.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.93.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.93.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.93.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.94.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.94.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.94.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.95.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.95.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.95.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.96.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.96.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.96.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.97.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.97.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.97.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.98.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.98.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.98.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.99.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.99.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.experts.gate_up_proj_list.99.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.gate.weight": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.down_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.down_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.down_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.gate_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.gate_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.gate_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.up_proj.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.up_proj.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert.up_proj.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert_gate.W_q_packed": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert_gate.scale": "model-00002-of-00004.safetensors", "model.language_model.layers.9.mlp.shared_expert_gate.zero": "model-00002-of-00004.safetensors", "model.language_model.layers.9.post_attention_layernorm.weight": "model-00002-of-00004.safetensors", "model.language_model.norm.weight": "model-00004-of-00004.safetensors", "model.visual.blocks.0.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.0.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.0.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.0.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.0.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.0.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.0.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.0.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.0.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.0.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.0.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.0.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.1.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.1.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.1.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.1.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.1.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.1.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.1.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.1.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.1.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.1.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.1.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.1.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.10.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.10.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.10.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.10.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.10.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.10.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.10.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.10.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.10.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.10.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.10.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.10.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.11.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.11.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.11.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.11.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.11.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.11.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.11.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.11.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.11.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.11.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.11.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.11.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.12.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.12.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.12.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.12.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.12.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.12.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.12.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.12.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.12.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.12.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.12.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.12.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.13.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.13.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.13.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.13.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.13.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.13.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.13.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.13.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.13.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.13.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.13.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.13.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.14.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.14.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.14.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.14.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.14.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.14.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.14.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.14.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.14.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.14.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.14.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.14.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.15.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.15.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.15.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.15.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.15.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.15.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.15.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.15.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.15.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.15.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.15.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.15.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.16.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.16.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.16.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.16.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.16.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.16.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.16.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.16.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.16.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.16.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.16.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.16.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.17.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.17.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.17.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.17.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.17.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.17.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.17.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.17.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.17.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.17.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.17.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.17.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.18.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.18.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.18.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.18.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.18.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.18.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.18.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.18.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.18.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.18.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.18.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.18.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.19.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.19.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.19.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.19.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.19.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.19.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.19.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.19.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.19.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.19.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.19.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.19.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.2.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.2.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.2.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.2.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.2.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.2.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.2.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.2.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.2.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.2.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.2.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.2.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.20.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.20.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.20.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.20.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.20.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.20.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.20.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.20.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.20.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.20.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.20.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.20.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.21.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.21.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.21.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.21.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.21.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.21.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.21.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.21.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.21.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.21.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.21.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.21.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.22.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.22.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.22.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.22.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.22.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.22.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.22.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.22.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.22.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.22.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.22.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.22.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.23.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.23.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.23.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.23.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.23.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.23.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.23.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.23.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.23.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.23.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.23.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.23.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.24.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.24.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.24.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.24.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.24.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.24.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.24.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.24.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.24.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.24.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.24.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.24.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.25.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.25.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.25.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.25.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.25.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.25.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.25.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.25.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.25.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.25.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.25.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.25.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.26.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.26.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.26.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.26.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.26.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.26.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.26.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.26.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.26.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.26.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.26.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.26.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.3.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.3.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.3.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.3.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.3.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.3.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.3.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.3.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.3.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.3.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.3.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.3.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.4.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.4.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.4.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.4.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.4.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.4.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.4.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.4.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.4.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.4.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.4.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.4.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.5.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.5.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.5.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.5.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.5.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.5.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.5.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.5.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.5.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.5.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.5.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.5.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.6.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.6.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.6.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.6.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.6.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.6.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.6.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.6.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.6.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.6.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.6.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.6.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.7.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.7.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.7.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.7.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.7.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.7.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.7.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.7.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.7.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.7.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.7.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.7.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.8.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.8.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.8.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.8.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.8.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.8.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.8.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.8.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.8.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.8.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.8.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.8.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.9.attn.proj.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.9.attn.proj.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.9.attn.qkv.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.9.attn.qkv.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.9.mlp.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.9.mlp.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.9.mlp.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.9.mlp.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.9.norm1.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.9.norm1.weight": "model-00001-of-00004.safetensors", "model.visual.blocks.9.norm2.bias": "model-00001-of-00004.safetensors", "model.visual.blocks.9.norm2.weight": "model-00001-of-00004.safetensors", "model.visual.merger.linear_fc1.bias": "model-00001-of-00004.safetensors", "model.visual.merger.linear_fc1.weight": "model-00001-of-00004.safetensors", "model.visual.merger.linear_fc2.bias": "model-00001-of-00004.safetensors", "model.visual.merger.linear_fc2.weight": "model-00001-of-00004.safetensors", "model.visual.merger.norm.bias": "model-00001-of-00004.safetensors", "model.visual.merger.norm.weight": "model-00001-of-00004.safetensors", "model.visual.patch_embed.proj.bias": "model-00001-of-00004.safetensors", "model.visual.patch_embed.proj.weight": "model-00001-of-00004.safetensors", "model.visual.pos_embed.weight": "model-00001-of-00004.safetensors" } }