{ "base_model": "/data/pretrained_models/Qwen3.5-2B", "original_units": "/home/lg/workflow_tooluse/Flow_RL_luogan/temp/metamath/metamath-output/setmm-train-qwen35-4b-mixed-12000/setmm-proof-units.jsonl", "expanded_units": "/home/lg/workflow_tooluse/Flow_RL_luogan/temp/metamath/metamath-output/setmm-train-qwen35-4b-mixed-12000/setmm-expanded-units.jsonl", "output_dir": "/data/pretrained_models/Qwen3.5-2B-metamath", "merged_dir": "/data/pretrained_models/Qwen3.5-2B-metamath/merged", "train_examples": 15267, "eval_examples": 311, "skipped_examples": 422, "max_length": 6144, "direct_ref_mode": "same-file-distractors", "same_file_distractor_direct_refs": 4, "shuffle_direct_refs": true, "learning_rate": 0.0001, "lora_rank": 32, "lora_alpha": 64 }