Spaces:

RadicalNotionAI
/

modeldna

Running

trohrbaugh committed 5 days ago

Commit

39d11b5

verified ·

1 Parent(s): 5da97e4

Add hunyuan_v3 (hy_v3) to KNOWN_BASES

Files changed (1) hide show

scan.py CHANGED Viewed

@@ -252,6 +252,13 @@ KNOWN_BASES = {
         # vocab ≈ Gemma tokenizer + 128 extra tokens; trained on AMD MI300x
         # 74B-Preview is pre-RL reasoning base (no RLHF/instruct tuning)
     },
     "mellum": {
         "name": "JetBrains Mellum (code-specialized MoE)",
         "vocab_size": 98304,

         # vocab ≈ Gemma tokenizer + 128 extra tokens; trained on AMD MI300x
         # 74B-Preview is pre-RL reasoning base (no RLHF/instruct tuning)
     },
+    "hunyuan_v3": {
+        "name": "Tencent Hunyuan V3 / Hy-MT2 (MoE)",
+        "vocab_size": 120832,
+        "model_type_patterns": ["hy_v3"],
+        # Hy-MT2 series: 1.8B dense, 7B dense, 30B-A3B MoE (128E/8A).
+        # 48 layers, hidden=2048 for MoE tier. QK norm. HYV3ForCausalLM.
+    },
     "mellum": {
         "name": "JetBrains Mellum (code-specialized MoE)",
         "vocab_size": 98304,