English
glove
lora
distillation
hard-negatives
qwen3-embedding
File size: 621 Bytes
35343f6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
{
  "experiment": "r300_qwen3teacher_hardnegs",
  "rank": 300,
  "d_model": 300,
  "vocab_size": 82741,
  "seq_len": 512,
  "batch_size": 256,
  "total_steps": 150000,
  "warmup": 1000,
  "lr": 0.0005,
  "min_lr": 1e-05,
  "weight_decay": 0.01,
  "grad_clip": 1.0,
  "tau": 0.05,
  "lambda_mse": 1.0,
  "H_hard_negatives_per_anchor": 64,
  "hard_neg_repo": "jsanzolac/qwen3_emb_512_hard_negatives",
  "warm_start_repo": "jsanzolac/bpe_glove_300_lora_r300_qwen3",
  "warm_start_path": "rank_300/checkpoint_final.pt",
  "glove_repo": "jsanzolac/drifting-glove-distilled-r300",
  "created_at": "2026-05-21T14:16:30.508447"
}