Upload locally saved GRIT fine-tuned model: open_llama_3b_v2 on Alpaca

Browse files

Files changed (6) hide show

README.md +84 -0
adapter_config.json +38 -0
adapter_model.safetensors +3 -0
special_tokens_map.json +24 -0
tokenizer.model +3 -0
tokenizer_config.json +43 -0

README.md ADDED Viewed

	@@ -0,0 +1,84 @@

+---
+tags:
+- llama
+- alpaca
+- grit
+- lora
+- qlora
+- instruction-tuning
+- fine-tuned
+base_model: openlm-research/open_llama_3b_v2
+library_name: peft
+license: apache-2.0
+datasets:
+- tatsu-lab/alpaca
+language:
+- en
+pipeline_tag: text-generation
+---
+# OpenLlama-3B-v2 Fine-tuned with GRIT and QLoRA
+This model is a fine-tuned version of [openlm-research/open_llama_3b_v2](https://huggingface.co/openlm-research/open_llama_3b_v2) using the **GRIT** (Gradient Regularized Instruction Tuning) algorithm and **QLoRA** on the [Alpaca dataset](https://huggingface.co/datasets/tatsu-lab/alpaca).
+The base model is quantized to 4-bit (NF4) to enable efficient fine-tuning.
+## 🚀 Training Details
+### GRIT Algorithm
+- **K-FAC Updates**: Every 200 steps for second-order preconditioning
+- **Neural Reprojection**: Every 500 steps for rank optimization
+- **Optimized LoRA Modules**: attention projection layers (`q_proj`, `k_proj`, `v_proj`, `o_proj`), matching `target_modules` in `adapter_config.json`
+### Fine-tuning Configuration
+- **Base Model**: OpenLlama 3B v2
+- **Quantization**: 4-bit (NF4) with float16 compute
+- **LoRA Rank**: 64
+- **LoRA Alpha**: 128
+- **Batch Size**: 16 (per device)
+- **Gradient Accumulation**: 4 (Effective batch = 64)
+- **Learning Rate**: 5.0e-05
+- **Precision**: bf16 mixed precision
+- **Sequence Length**: 512 tokens
+- **Gradient Checkpointing**: Enabled
+### Performance Improvements
+- ✅ **Faster Convergence**: K-FAC preconditioning aligns updates with curvature
+- ✅ **Memory-Efficient**: 4-bit quantization (QLoRA) and gradient checkpointing used.
+- ✅ **Efficient Training**: Training is run through the Hugging Face `accelerate` library.
+## 📊 Training Metrics (sample)
+- **Total Steps**: N/A (training session interrupted)
+- **Final Loss**: N/A (training session interrupted)
+- **BLEU (val)**: N/A (training session interrupted)
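+- **Trainable Params**: not logged (training session interrupted); ≈42.6M estimated from the 170 MB adapter checkpoint, assuming fp32 LoRA weights (rank 64 on `q_proj`/`k_proj`/`v_proj`/`o_proj`)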
+## 🏷️ Model Tags
+- Instruction-tuned with GRIT and QLoRA
+- GRIT-tuned Model
+- 4-bit Quantized Model
+- LoRA rank 64
+- Mixed precision (bf16)
+- Alpaca dataset fine-tuning
+## 📝 Algorithm Details
+- **K-FAC Preconditioning** (Natural Gradient) and **Neural Reprojection** as per GRIT method
+- **Memory Efficient**: K-FAC covariance matrices are kept on the CPU to reduce GPU memory usage
+## 🏆 Results
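+In benchmark comparisons of the method, GRIT has shown **faster convergence and better stability** than standard LoRA or full fine-tuning, making it well-suited for efficient single-epoch training. Note that no evaluation results are available for this particular checkpoint, because its training session was interrupted before metrics were recorded (see Training Metrics above).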
+## 📝 Citation
+If you use this model, please cite:
+```bibtex
+@misc{grit-openllama-3b-alpaca,
+  title={OpenLlama 3B v2 Fine-tuned with GRIT on Alpaca},
+  author={Pritish92},
+  year={2025},
+  publisher={Hugging Face},
+  url={https://huggingface.co/Pritish92/open-llama-3b-v2-grit-alpaca}
+}
+```
+## ⚖️ License
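+This adapter is released under the Apache 2.0 license, inherited from the base model [openlm-research/open_llama_3b_v2](https://huggingface.co/openlm-research/open_llama_3b_v2). Note that the Alpaca training data is distributed under CC BY-NC 4.0, so review its terms before any commercial use.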

adapter_config.json ADDED Viewed

	@@ -0,0 +1,38 @@

+{
+  "alpha_pattern": {},
+  "auto_mapping": null,
+  "base_model_name_or_path": "openlm-research/open_llama_3b_v2",
+  "bias": "none",
+  "corda_config": null,
+  "eva_config": null,
+  "exclude_modules": null,
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "init_lora_weights": true,
+  "layer_replication": null,
+  "layers_pattern": null,
+  "layers_to_transform": null,
+  "loftq_config": {},
+  "lora_alpha": 128,
+  "lora_bias": false,
+  "lora_dropout": 0.05,
+  "megatron_config": null,
+  "megatron_core": "megatron.core",
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "qalora_group_size": 16,
+  "r": 64,
+  "rank_pattern": {},
+  "revision": null,
+  "target_modules": [
+    "o_proj",
+    "v_proj",
+    "k_proj",
+    "q_proj"
+  ],
+  "task_type": "CAUSAL_LM",
+  "trainable_token_indices": null,
+  "use_dora": false,
+  "use_qalora": false,
+  "use_rslora": false
+}

adapter_model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6929a2ecf69a74e1a32c26800ef41ae3c3a117aee3db75a1b64ffc61dd7a918a
+size 170421784

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "</s>",
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:91b289e85fa20fd375d8b33dc12f77616f18abc6359804471d1fafcb425fecb8
+size 511574

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,43 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "add_prefix_space": true,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "legacy": true,
+  "model_max_length": 2048,
+  "pad_token": "</s>",
+  "sp_model_kwargs": {},
+  "spaces_between_special_tokens": false,
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<unk>",
+  "use_default_system_prompt": false
+}