sumeru-i / modeling_sumeru.py
AgeOfAiTeam's picture
update model files and readme
01019b9 verified
Raw
History Blame Contribute Delete
867 Bytes
"""Sumeru model class — thin wrapper over Gemma 4 architecture.
Copyright (c) 2026 Sumeru AI. Licensed under Apache 2.0.
Usage:
from transformers import AutoModelForCausalLM, AutoProcessor
processor = AutoProcessor.from_pretrained("debowd/sumeru-i", trust_remote_code=True)
model = AutoModelForCausalLM.from_pretrained("debowd/sumeru-i", trust_remote_code=True)
"""
from transformers import Gemma4ForConditionalGeneration
from .configuration_sumeru import SumeruConfig
class SumeruForCausalLM(Gemma4ForConditionalGeneration):
    """Causal language model for the Sumeru family.

    Sumeru is a family of small language models built by Sumeru AI for
    Indian education: math, science, the NCERT curriculum, and JEE / NEET
    preparation.

    As written here, the class is a direct subclass of
    ``Gemma4ForConditionalGeneration``: it sets ``config_class`` and defines a
    constructor that delegates to the parent, and adds nothing else.
    """

    # Configuration class paired with this model class.
    config_class = SumeruConfig

    def __init__(self, config: SumeruConfig) -> None:
        """Construct the model by delegating to the parent constructor.

        Args:
            config: Model configuration, passed unchanged to the parent
                class. Presumably a ``SumeruConfig``; this is not checked.
        """
        super().__init__(config)
        # post_init() is not defined in this class, so it comes from the
        # parent hierarchy.
        # NOTE(review): the parent constructor may already invoke post_init();
        # confirm whether this second call is required before removing it.
        self.post_init()