{
  "talker": {
    "hidden_size": 1024,
    "text_hidden_size": 2048,
    "vocab_size": 3072,
    "num_hidden_layers": 28,
    "num_attention_heads": 16,
    "num_key_value_heads": 8,
    "head_dim": 128,
    "num_code_groups": 16,
    "codec_eos_token_id": 2150,
    "codec_think_id": 2154,
    "codec_nothink_id": 2155,
    "codec_think_bos_id": 2156,
    "codec_think_eos_id": 2157,
    "codec_pad_id": 2148,
    "codec_bos_id": 2149,
    "rope_theta": 1000000
  },
  "code_predictor": {
    "hidden_size": 1024,
    "vocab_size": 2048,
    "num_hidden_layers": 5,
    "num_attention_heads": 16,
    "num_key_value_heads": 8,
    "head_dim": 128,
    "rope_theta": 1000000
  },
  "tts": {
    "tts_bos_token_id": 151672,
    "tts_eos_token_id": 151673,
    "tts_pad_token_id": 151671,
    "im_start_token_id": 151644,
    "im_end_token_id": 151645
  },
  "language_ids": {
    "chinese": 2055,
    "english": 2050,
    "german": 2053,
    "italian": 2070,
    "portuguese": 2071,
    "spanish": 2054,
    "japanese": 2058,
    "korean": 2064,
    "french": 2061,
    "russian": 2069,
    "beijing_dialect": 2074,
    "sichuan_dialect": 2062
  },
  "speaker_dialect": {
    "serena": false,
    "vivian": false,
    "uncle_fu": false,
    "ryan": false,
    "aiden": false,
    "ono_anna": false,
    "sohee": false,
    "eric": "sichuan_dialect",
    "dylan": "beijing_dialect"
  }
}