guzus's picture
Upload smoke DPO LoRA adapter from SGS ferrari run
312ceab verified
Raw
History Blame
547 Bytes
{
"model": "/data/screenwriter/training/outputs/sgs-smoke/sft",
"base_model": null,
"seq_len": 2048,
"load_in_4bit": false,
"beta": 0.1,
"data": "/data/screenwriter/training/outputs/_smoke_data/dpo_train.jsonl",
"eval": "/data/screenwriter/training/outputs/_smoke_data/dpo_test.jsonl",
"epochs": 1,
"batch_size": 1,
"grad_accum": 1,
"lr": 2e-05,
"warmup_steps": 0,
"max_steps": 1,
"output": "/data/screenwriter/training/outputs/sgs-smoke/dpo",
"save_steps": 1,
"logging_steps": 1,
"seed": 3407,
"wandb": false
}