{ "metadata": { "total_parameters": 5490589204, "total_size": 21789904208 }, "weight_map": { "lm_head.weight": "model-00005-of-00005.safetensors", "model.action_expert.action_embed.bias": "model-00004-of-00005.safetensors", "model.action_expert.action_embed.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.0.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.1.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.10.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.11.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.12.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.13.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.14.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.15.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.16.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.17.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.18.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.19.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.2.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.20.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.21.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.22.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.23.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.24.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.25.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.25.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.25.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.26.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.26.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.27.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.28.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.29.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.3.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.3.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.30.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.30.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.31.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.32.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.33.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.34.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.cross_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.cross_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.cross_attn.q_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.cross_attn.q_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.mlp.down_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.mlp.down_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.mlp.gate_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.mlp.gate_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.mlp.up_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.mlp.up_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.self_attn.out_proj.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.self_attn.out_proj.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.self_attn.qkv.bias": "model-00005-of-00005.safetensors", "model.action_expert.blocks.35.self_attn.qkv.weight": "model-00005-of-00005.safetensors", "model.action_expert.blocks.4.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.4.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.5.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.6.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.7.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.8.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.cross_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.cross_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.cross_attn.q_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.cross_attn.q_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.mlp.down_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.mlp.down_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.mlp.gate_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.mlp.gate_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.mlp.up_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.mlp.up_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.modulation.linear.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.modulation.linear.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.self_attn.out_proj.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.self_attn.out_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.self_attn.qkv.bias": "model-00004-of-00005.safetensors", "model.action_expert.blocks.9.self_attn.qkv.weight": "model-00004-of-00005.safetensors", "model.action_expert.context_k_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.context_v_proj.weight": "model-00004-of-00005.safetensors", "model.action_expert.final_layer.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.final_layer.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.final_layer.modulation.linear.bias": "model-00005-of-00005.safetensors", "model.action_expert.final_layer.modulation.linear.weight": "model-00005-of-00005.safetensors", "model.action_expert.time_embed.1.bias": "model-00004-of-00005.safetensors", "model.action_expert.time_embed.1.weight": "model-00004-of-00005.safetensors", "model.action_expert.time_embed.3.bias": "model-00004-of-00005.safetensors", "model.action_expert.time_embed.3.weight": "model-00004-of-00005.safetensors", "model.action_expert_depth_gate.0.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.0.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.1.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.1.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.10.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.10.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.11.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.11.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.12.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.12.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.13.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.13.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.14.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.14.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.15.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.15.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.16.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.16.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.17.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.17.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.18.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.18.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.19.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.19.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.2.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.2.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.20.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.20.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.21.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.21.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.22.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.22.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.23.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.23.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.24.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.24.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.25.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.25.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.26.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.26.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.27.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.27.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.28.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.28.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.29.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.29.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.3.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.3.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.30.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.30.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.31.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.31.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.32.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.32.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.33.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.33.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.34.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.34.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.35.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.35.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.4.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.4.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.5.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.5.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.6.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.6.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.7.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.7.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.8.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.8.weight": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.9.bias": "model-00005-of-00005.safetensors", "model.action_expert_depth_gate.9.weight": "model-00005-of-00005.safetensors", "model.transformer.blocks.0.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.0.ff_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.0.mlp.ff_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.0.mlp.ff_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.0.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.0.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.0.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.0.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.1.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.1.ff_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.1.mlp.ff_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.1.mlp.ff_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.1.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.1.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.1.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.1.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.10.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.10.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.10.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.10.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.10.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.10.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.10.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.10.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.11.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.11.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.11.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.11.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.11.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.11.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.11.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.11.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.12.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.12.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.12.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.12.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.12.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.12.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.12.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.12.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.13.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.13.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.13.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.13.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.13.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.13.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.13.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.13.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.14.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.14.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.14.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.14.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.14.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.14.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.14.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.14.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.15.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.15.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.15.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.15.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.15.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.15.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.15.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.15.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.16.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.16.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.16.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.16.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.16.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.16.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.16.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.16.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.17.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.17.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.17.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.17.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.17.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.17.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.17.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.17.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.18.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.18.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.18.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.18.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.18.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.18.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.18.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.18.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.19.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.19.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.19.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.19.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.19.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.19.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.19.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.19.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.2.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.2.ff_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.2.mlp.ff_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.2.mlp.ff_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.2.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.2.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.2.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.2.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.20.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.20.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.20.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.20.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.20.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.20.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.20.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.20.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.21.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.21.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.21.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.21.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.21.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.21.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.21.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.21.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.22.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.22.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.22.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.22.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.22.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.22.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.22.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.22.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.23.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.23.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.23.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.23.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.23.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.23.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.23.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.23.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.24.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.24.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.24.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.24.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.24.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.24.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.24.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.24.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.25.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.25.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.25.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.25.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.25.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.25.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.25.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.25.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.26.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.26.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.26.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.26.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.26.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.26.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.26.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.26.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.27.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.27.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.27.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.27.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.27.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.27.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.27.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.27.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.28.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.28.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.28.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.28.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.28.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.28.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.28.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.28.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.29.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.29.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.29.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.29.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.29.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.29.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.29.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.29.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.3.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.3.ff_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.3.mlp.ff_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.3.mlp.ff_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.3.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.3.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.3.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.3.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.30.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.30.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.30.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.30.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.30.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.30.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.30.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.30.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.31.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.31.ff_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.31.mlp.ff_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.31.mlp.ff_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.31.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.31.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.31.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.31.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.32.attn_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.32.ff_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.32.mlp.ff_out.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.32.mlp.ff_proj.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.32.self_attn.att_proj.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.32.self_attn.attn_out.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.32.self_attn.k_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.32.self_attn.q_norm.weight": "model-00003-of-00005.safetensors", "model.transformer.blocks.33.attn_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.33.ff_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.33.mlp.ff_out.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.33.mlp.ff_proj.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.33.self_attn.att_proj.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.33.self_attn.attn_out.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.33.self_attn.k_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.33.self_attn.q_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.34.attn_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.34.ff_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.34.mlp.ff_out.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.34.mlp.ff_proj.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.34.self_attn.att_proj.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.34.self_attn.attn_out.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.34.self_attn.k_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.34.self_attn.q_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.35.attn_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.35.ff_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.35.mlp.ff_out.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.35.mlp.ff_proj.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.35.self_attn.att_proj.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.35.self_attn.attn_out.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.35.self_attn.k_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.35.self_attn.q_norm.weight": "model-00004-of-00005.safetensors", "model.transformer.blocks.4.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.4.ff_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.4.mlp.ff_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.4.mlp.ff_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.4.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.4.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.4.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.4.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.5.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.5.ff_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.5.mlp.ff_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.5.mlp.ff_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.5.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.5.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.5.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.5.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.6.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.6.ff_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.6.mlp.ff_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.6.mlp.ff_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.6.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.6.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.6.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.6.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.7.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.7.ff_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.7.mlp.ff_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.7.mlp.ff_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.7.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.7.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.7.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.7.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.8.attn_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.8.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.8.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.8.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.8.self_attn.att_proj.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.8.self_attn.attn_out.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.8.self_attn.k_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.8.self_attn.q_norm.weight": "model-00001-of-00005.safetensors", "model.transformer.blocks.9.attn_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.9.ff_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.9.mlp.ff_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.9.mlp.ff_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.9.self_attn.att_proj.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.9.self_attn.attn_out.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.9.self_attn.k_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.blocks.9.self_attn.q_norm.weight": "model-00002-of-00005.safetensors", "model.transformer.ln_f.weight": "model-00004-of-00005.safetensors", "model.transformer.rotary_emb.inv_freq": "model-00004-of-00005.safetensors", "model.transformer.wte.embedding": "model-00001-of-00005.safetensors", "model.transformer.wte.new_embedding": "model-00001-of-00005.safetensors", "model.vision_backbone.image_pooling_2d.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_pooling_2d.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_pooling_2d.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_pooling_2d.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_pooling_2d.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_pooling_2d.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_pooling_2d.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_pooling_2d.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_projector.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_projector.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_projector.w3.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.patch_embedding.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.patch_embedding.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.positional_embedding": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.0.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.1.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.10.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.11.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.12.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.13.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.14.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.15.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.16.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.17.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.18.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.19.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.2.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.20.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.21.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.22.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.23.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.24.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.3.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.4.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.5.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.6.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.7.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.8.ffn_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention.wk.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention.wk.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention.wo.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention.wo.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention.wq.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention.wq.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention.wv.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention.wv.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.attention_norm.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.feed_forward.w1.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.feed_forward.w1.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.feed_forward.w2.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.feed_forward.w2.weight": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.ffn_norm.bias": "model-00004-of-00005.safetensors", "model.vision_backbone.image_vit.transformer.resblocks.9.ffn_norm.weight": "model-00004-of-00005.safetensors" } }