{ "global_step": 5000, "bucket_weights": { "aime": 4897.0, "capability": 8000.0, "chat_singleturn": 3000.0, "code_proc": 18000.0, "ifeval_proc": 528.0, "judge": 4500.0, "long_context": 17500.0, "math_proc": 27500.0, "mbpp_proc": 10000.0, "reasoning_proc": 6511.0, "tool_use_proc": 20000.0, "chat_turns": 12000.0 }, "bucket_rows": { "aime": 4897, "capability": 8000, "chat_singleturn": 3000, "code_proc": 18000, "ifeval_proc": 528, "judge": 4500, "long_context": 17500, "math_proc": 27500, "mbpp_proc": 10000, "reasoning_proc": 6511, "tool_use_proc": 20000, "chat_turns": 12000 }, "min_assistant_chars": 0, "per_row_ce": true, "per_row_ce_length_norm": true, "length_norm_cap": 256, "max_steps": 6000, "warmup_steps": 600, "lr": 2e-05, "seed": 42, "aux_coeff": 0.001, "router_lr_scale": 0.1, "aux_only": false, "phase": "sft_mixed" }