{ "metadata": { "total_parameters": 6352005184, "total_size": 25408020736 }, "weight_map": { "esmc.embed.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.0.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.1.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.10.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.11.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.12.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.13.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.14.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.15.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.15.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.15.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.16.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.16.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.16.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.16.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.16.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.17.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.17.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.17.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.17.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.18.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.18.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.18.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.18.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.19.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.19.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.19.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.19.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.2.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.2.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.20.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.20.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.20.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.20.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.20.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.21.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.21.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.21.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.21.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.22.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.22.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.22.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.22.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.23.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.23.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.23.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.23.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.24.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.24.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.24.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.24.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.25.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.25.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.25.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.25.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.26.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.26.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.26.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.26.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.27.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.27.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.27.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.27.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.28.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.28.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.28.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.28.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.29.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.29.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.29.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.29.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.3.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.3.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.30.attn.k_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.30.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.attn.layernorm_qkv.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.30.attn.out_proj.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.attn.q_ln.weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.30.ffn.fc1_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.ffn.fc2_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.ffn.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.30.ffn.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.31.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.31.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.31.attn.layernorm_qkv.layer_norm_bias": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.31.attn.layernorm_qkv.layer_norm_weight": "model-00002-of-00006.safetensors", "esmc.transformer.blocks.31.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.31.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.31.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.31.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.31.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.31.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.31.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.31.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.31.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.32.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.32.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.32.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.32.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.33.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.33.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.33.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.33.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.34.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.34.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.34.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.34.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.35.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.35.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.35.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.35.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.36.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.36.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.36.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.36.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.37.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.37.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.37.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.37.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.38.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.38.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.38.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.38.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.39.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.39.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.39.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.39.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.4.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.4.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.40.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.40.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.40.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.40.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.40.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.41.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.41.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.41.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.41.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.42.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.42.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.42.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.42.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.43.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.43.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.43.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.43.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.44.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.44.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.44.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.44.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.45.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.45.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.45.ffn.fc1_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.ffn.fc2_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.45.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.46.attn.k_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.46.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.46.attn.layernorm_qkv.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.46.attn.layernorm_qkv.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.46.attn.layernorm_qkv.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.46.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.46.attn.out_proj.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.46.attn.q_ln.weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.46.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.46.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.46.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.46.ffn.layer_norm_bias": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.46.ffn.layer_norm_weight": "model-00003-of-00006.safetensors", "esmc.transformer.blocks.47.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.47.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.47.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.47.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.47.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.48.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.48.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.48.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.48.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.49.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.49.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.49.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.49.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.5.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.5.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.50.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.50.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.50.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.50.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.50.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.51.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.51.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.51.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.51.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.52.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.52.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.52.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.52.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.53.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.53.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.53.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.53.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.54.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.54.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.54.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.54.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.55.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.55.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.55.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.55.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.56.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.56.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.56.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.56.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.57.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.57.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.57.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.57.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.58.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.58.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.58.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.58.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.59.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.59.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.59.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.59.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.6.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.6.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.60.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.60.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.60.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.60.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.60.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.attn.k_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.61.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.attn.layernorm_qkv.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.61.attn.out_proj.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.attn.q_ln.weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.61.ffn.fc1_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.ffn.fc2_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.ffn.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.61.ffn.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.62.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.62.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.62.attn.layernorm_qkv.layer_norm_bias": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.62.attn.layernorm_qkv.layer_norm_weight": "model-00004-of-00006.safetensors", "esmc.transformer.blocks.62.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.62.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.62.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.62.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.62.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.62.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.62.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.62.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.62.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.63.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.63.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.63.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.63.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.64.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.64.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.64.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.64.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.65.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.65.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.65.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.65.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.66.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.66.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.66.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.66.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.67.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.67.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.67.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.67.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.68.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.68.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.68.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.68.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.69.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.69.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.69.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.69.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.7.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.7.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.70.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.70.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.70.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.70.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.70.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.71.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.71.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.71.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.71.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.72.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.72.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.72.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.72.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.73.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.73.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.73.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.73.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.74.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.74.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.74.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.74.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.75.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.75.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.75.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.75.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.76.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.76.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.76.ffn.fc1_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.ffn.fc2_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.76.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.77.attn.k_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.77.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.77.attn.layernorm_qkv.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.77.attn.layernorm_qkv.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.77.attn.layernorm_qkv.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.77.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.77.attn.out_proj.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.77.attn.q_ln.weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.77.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.77.ffn.fc1_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.77.ffn.fc2_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.77.ffn.layer_norm_bias": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.77.ffn.layer_norm_weight": "model-00005-of-00006.safetensors", "esmc.transformer.blocks.78.attn.k_ln.weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.78.attn.layernorm_qkv.layer_norm_bias": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.attn.layernorm_qkv.layer_norm_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.attn.layernorm_qkv.weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.78.attn.out_proj.weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.attn.q_ln.weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.78.ffn.fc1_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.ffn.fc2_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.ffn.layer_norm_bias": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.78.ffn.layer_norm_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.attn.k_ln.weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.79.attn.layernorm_qkv.layer_norm_bias": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.attn.layernorm_qkv.layer_norm_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.attn.layernorm_qkv.weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.79.attn.out_proj.weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.attn.q_ln.weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.79.ffn.fc1_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.ffn.fc2_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.ffn.layer_norm_bias": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.79.ffn.layer_norm_weight": "model-00006-of-00006.safetensors", "esmc.transformer.blocks.8.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.8.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.attn.k_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.attn.layernorm_qkv._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.attn.layernorm_qkv.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.attn.layernorm_qkv.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.attn.layernorm_qkv.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.attn.out_proj._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.attn.out_proj.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.attn.q_ln.weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.ffn._extra_state": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.ffn.fc1_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.ffn.fc2_weight": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.ffn.layer_norm_bias": "model-00001-of-00006.safetensors", "esmc.transformer.blocks.9.ffn.layer_norm_weight": "model-00001-of-00006.safetensors", "esmc.transformer.norm.weight": "model-00006-of-00006.safetensors", "lm_head.0.bias": "model-00006-of-00006.safetensors", "lm_head.0.weight": "model-00006-of-00006.safetensors", "lm_head.2.bias": "model-00006-of-00006.safetensors", "lm_head.2.weight": "model-00006-of-00006.safetensors", "lm_head.3.bias": "model-00006-of-00006.safetensors", "lm_head.3.weight": "model-00006-of-00006.safetensors" } }