{
  "experiment": "qkv_v_only_hardnegs",
  "rank": 300,
  "d_model": 300,
  "vocab_size": 82741,
  "seq_len": 512,
  "batch_size": 256,
  "total_steps": 150000,
  "warmup": 1000,
  "lr": 0.0005,
  "min_lr": 1e-05,
  "weight_decay": 0.01,
  "grad_clip": 1.0,
  "tau": 0.05,
  "lambda_mse": 0.1,
  "H_hard_negatives_per_anchor": 64,
  "glove_E_repo": "jsanzolac/drifting-glove-distilled-r300",
  "k_lora_repo": "jsanzolac/bpe_glove_300_lora_r300_qwen3",
  "k_lora_path": "rank_300/checkpoint_final.pt",
  "hard_neg_repo": "jsanzolac/qwen3_emb_512_hard_negatives",
  "pack_repo": "jsanzolac/qwen3_emb_300_packed_cl100k",
  "created_at": "2026-05-21T16:01:51.873137"
}