English
glove
lora
distillation
hard-negatives
qkv-split
jsanzolac's picture
Upload rank_300/config.json with huggingface_hub
ee9bef9 verified
{
"experiment": "qkv_v_only_hardnegs",
"rank": 300,
"d_model": 300,
"vocab_size": 82741,
"seq_len": 512,
"batch_size": 256,
"total_steps": 150000,
"warmup": 1000,
"lr": 0.0005,
"min_lr": 1e-05,
"weight_decay": 0.01,
"grad_clip": 1.0,
"tau": 0.05,
"lambda_mse": 0.1,
"H_hard_negatives_per_anchor": 64,
"glove_E_repo": "jsanzolac/drifting-glove-distilled-r300",
"k_lora_repo": "jsanzolac/bpe_glove_300_lora_r300_qwen3",
"k_lora_path": "rank_300/checkpoint_final.pt",
"hard_neg_repo": "jsanzolac/qwen3_emb_512_hard_negatives",
"pack_repo": "jsanzolac/qwen3_emb_300_packed_cl100k",
"created_at": "2026-05-21T16:01:51.873137"
}