# Data-related settings.
data:
  # Tokenizer configuration.
  tokenizer:
    # Tokenizer kind; presumably selects a Hugging Face-backed loader
    # (confirm against the code that consumes this config).
    name: huggingface
    # Tokenizer location; looks like a Hugging Face Hub repo ID
    # ("org/model") rather than a local path -- TODO confirm.
    path: google/gemma-2-2b