English
glove
lora
distillation
bpe
cl100k_base
jsanzolac committed on
Commit
5171bc2
·
verified ·
1 Parent(s): 1996774

Upload rank_512/config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. rank_512/config.json +20 -0
rank_512/config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "variant": 1,
3
+ "rank": 512,
4
+ "d_model": 512,
5
+ "vocab_size": 90181,
6
+ "seq_len": 512,
7
+ "batch_size": 256,
8
+ "total_steps": 30000,
9
+ "warmup": 500,
10
+ "lr": 0.0005,
11
+ "min_lr": 1e-05,
12
+ "weight_decay": 0.01,
13
+ "grad_clip": 1.0,
14
+ "tau": 0.05,
15
+ "lambda_nce": 1.0,
16
+ "lambda_density": 0.1,
17
+ "teacher_model": "Qwen/Qwen3-Embedding-8B",
18
+ "teacher_max_len": 512,
19
+ "created_at": "2026-05-15T20:58:32.459093"
20
+ }