thangvip's picture
infra: CUDA build for T4 GPU + revert to base Qwen2.5-3B-Instruct
887ab1c verified
Raw
History Blame Contribute Delete
159 Bytes
from pathlib import Path
# Model location constants.
# NOTE(review): the consumer of these values is not visible here; MODEL_REPO
# looks like a Hugging Face Hub repo id ("owner/name") -- confirm against the
# download code.
MODEL_REPO = "Qwen/Qwen2.5-3B-Instruct-GGUF"

# File name of the GGUF weights file (presumably the file fetched from
# MODEL_REPO -- verify against the caller).
MODEL_FILE = "qwen2.5-3b-instruct-q4_k_m.gguf"

# Relative path "models/<MODEL_FILE>"; being relative, it resolves against the
# process's current working directory.
MODEL_PATH = Path("models", MODEL_FILE)