Instructions to use mrinaldi/albertina_mini_alibi_7B_tokens with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use mrinaldi/albertina_mini_alibi_7B_tokens with Transformers:
# Load model directly from transformers import AutoModel model = AutoModel.from_pretrained("mrinaldi/albertina_mini_alibi_7B_tokens", trust_remote_code=True, dtype="auto") - Notebooks
- Google Colab
- Kaggle
File size: 1,820 Bytes
b7c976d | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 | {
"model_class": "BERTModel",
"model_config": {
"name": "Albertina_mini_alibi",
"hidden_size": 768,
"ffn_factor": 3.0,
"vocab_size": 32768,
"bos_token_id": 5,
"eos_token_id": 6,
"pad_token_id": 0,
"mask_token_id": 4,
"masked_substitution_rate": 0.2,
"cloze_probability": 1.0,
"random_probability": 0.0,
"same_probability": 0.0,
"num_hidden_layers": 6,
"num_attention_heads": 12,
"tie_word_embeddings": false,
"rms_norm_eps": 1e-06,
"attention_type": [],
"max_position_embeddings": 1024,
"block_size_for_attention": 128,
"compile_flexattn": false,
"bias": false,
"default_layer": {
"attn_impl": "flash",
"sliding_window_size": null,
"positional_encoding": "alibi",
"normalization": "rmsnorm",
"normalization_position": "pre",
"ffn_activation": "swiglu",
"hooks": {}
},
"custom_layers": {}
},
"training": {
"optimizer": "muon",
"lr_scheduling": true,
"lr": 0.0005,
"final_lr": 2e-05,
"hold_steps": 0.0,
"weight_decay": 0.01,
"scheduler": "custom",
"gradient_clip_val": 1.0,
"warmup_steps": 0.05,
"max_epochs": 1,
"accumulate_grad_batches": 16,
"seed": 27,
"save_every_n_steps": 100,
"checkpoint_name": "Albertina_mini_alibi"
},
"tokenizer": {
"type": "huggingface",
"pretrained_name": "mrinaldi/Gettone",
"varlen_strategy": "unpadding"
},
"data": {
"data_root": "/mnt/llmdata/data/Albertone_MDAT",
"batch_size": 48,
"num_workers": 1,
"mdat_strategy": "Gettone1024_",
"mdat_view": "Albertina7B",
"wanted_from_strategy": "chunked_for_recurrence"
},
"save_dir": "./checkpoints_albertina_gold",
"wandb_project": "Albertina_gold",
"wandb_run_name": "Albertina_mini_alibi"
} |