File size: 867 Bytes
"""Sumeru model class — thin wrapper over Gemma 4 architecture.

Copyright (c) 2026 Sumeru AI. Licensed under Apache 2.0.

Usage:
    from transformers import AutoModelForCausalLM, AutoProcessor

    processor = AutoProcessor.from_pretrained("debowd/sumeru-i", trust_remote_code=True)
    model = AutoModelForCausalLM.from_pretrained("debowd/sumeru-i", trust_remote_code=True)
"""
from transformers import Gemma4ForConditionalGeneration
from .configuration_sumeru import SumeruConfig
class SumeruForCausalLM(Gemma4ForConditionalGeneration):
    """Causal language model for the Sumeru family.

    Sumeru models are small language models built by Sumeru AI for Indian
    education: math, science, the NCERT curriculum, and JEE / NEET prep.

    The class subclasses ``Gemma4ForConditionalGeneration``, sets
    ``SumeruConfig`` as its ``config_class`` and otherwise defers to the
    parent implementation.
    """

    # Configuration class associated with this model.
    config_class = SumeruConfig

    def __init__(self, config: SumeruConfig) -> None:
        """Build the model from ``config``.

        Args:
            config: Configuration object, forwarded unchanged to the parent
                constructor.
        """
        super().__init__(config)
        # NOTE(review): the parent constructor may already invoke post_init();
        # the explicit call is kept so behaviour matches the original — confirm
        # against the installed transformers version before removing it.
        self.post_init()
|