Spaces:

hayas
/

CAT-Translate-7b

Running on Zero

App Files Files Community

hayas committed on Mar 2

Commit

c8619d3

1 Parent(s): 8f7d8ef

Add files

Browse files

Files changed (7) hide show

.python-version +1 -0
README.md +2 -1
app.py +151 -0
pyproject.toml +59 -0
requirements.txt +305 -0
style.css +4 -0
uv.lock +0 -0

.python-version ADDED Viewed

	@@ -0,0 +1 @@


1	+ 3.12

README.md CHANGED Viewed

@@ -1,10 +1,11 @@
 ---
 title: CAT Translate 7b
-emoji: 🦀
 colorFrom: indigo
 colorTo: yellow
 sdk: gradio
 sdk_version: 6.8.0
 app_file: app.py
 pinned: false
 ---

 ---
 title: CAT Translate 7b
+emoji: 🐱
 colorFrom: indigo
 colorTo: yellow
 sdk: gradio
 sdk_version: 6.8.0
+python_version: "3.12.12"
 app_file: app.py
 pinned: false
 ---

app.py ADDED Viewed

	@@ -0,0 +1,151 @@

+#!/usr/bin/env python
+import os
+import gradio as gr
+import spaces
+import torch
+from transformers import AutoModelForCausalLM, AutoTokenizer
+MAX_NEW_TOKENS_LIMIT = int(os.getenv("MAX_NEW_TOKENS_LIMIT", "2000"))
+MAX_NEW_TOKENS_DEFAULT = int(os.getenv("MAX_NEW_TOKENS_DEFAULT", "500"))
+MAX_TOTAL_TOKENS = int(os.getenv("MAX_TOTAL_TOKENS", "8192"))
+MODEL_ID = "cyberagent/CAT-Translate-7b"
+tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
+model = AutoModelForCausalLM.from_pretrained(MODEL_ID, torch_dtype=torch.bfloat16, device_map="auto")
+PROMPT_TEMPLATE = "Translate the following {src_lang} text into {tgt_lang}.\n\n{src_text}"
+DIRECTION_LANGS: dict[str, tuple[str, str]] = {
+    "Japanese → English": ("Japanese", "English"),
+    "English → Japanese": ("English", "Japanese"),
+}
+DEFAULT_DIRECTION = "Japanese → English"
+def _build_messages(text: str, direction: str) -> list[dict]:
+    src_lang, tgt_lang = DIRECTION_LANGS[direction]
+    content = PROMPT_TEMPLATE.format(src_lang=src_lang, tgt_lang=tgt_lang, src_text=text)
+    return [{"role": "user", "content": content}]
+def count_tokens(text: str, direction: str) -> str:
+    """Count input tokens without GPU. Returns a short info string."""
+    if not text:
+        return ""
+    messages = _build_messages(text, direction)
+    input_ids = tokenizer.apply_chat_template(messages, tokenize=True, add_generation_prompt=True, return_dict=False)
+    return f"Input tokens: {len(input_ids)}"
+@spaces.GPU(duration=60)
+@torch.inference_mode()
+def translate(text: str, direction: str, max_new_tokens: int) -> str:
+    if not text:
+        raise gr.Error("Please enter text to translate")
+    messages = _build_messages(text, direction)
+    inputs = tokenizer.apply_chat_template(
+        messages, tokenize=True, add_generation_prompt=True, return_dict=True, return_tensors="pt"
+    ).to(model.device)
+    input_len = len(inputs["input_ids"][0])
+    if input_len + max_new_tokens > MAX_TOTAL_TOKENS:
+        error_message = (
+            f"Input ({input_len} tokens) + max output ({max_new_tokens} tokens)"
+            f" exceeds the total limit of {MAX_TOTAL_TOKENS} tokens."
+        )
+        raise gr.Error(error_message)
+    generation = model.generate(**inputs, do_sample=False, max_new_tokens=max_new_tokens, use_cache=True)
+    generation = generation[0][input_len:]
+    return tokenizer.decode(generation, skip_special_tokens=True)
+with gr.Blocks() as demo:
+    gr.Markdown("# CAT-Translate-7b")
+    direction = gr.Radio(
+        label="Translation Direction",
+        choices=list(DIRECTION_LANGS.keys()),
+        value=DEFAULT_DIRECTION,
+    )
+    max_new_tokens = gr.Slider(
+        label="Max New Tokens",
+        info="Higher values allow longer translations but take more time",
+        minimum=50,
+        maximum=MAX_NEW_TOKENS_LIMIT,
+        step=10,
+        value=MAX_NEW_TOKENS_DEFAULT,
+    )
+    with gr.Row():
+        with gr.Column():
+            text = gr.Textbox(label="Input", lines=10, placeholder="Enter text to translate")
+            token_info = gr.Textbox(label="Token Count", lines=1)
+            translate_button = gr.Button("Translate", variant="primary")
+        with gr.Column():
+            output = gr.Textbox(label="Translation", lines=10, placeholder="Translation will appear here")
+    token_count_inputs = [text, direction]
+    for component in token_count_inputs:
+        component.change(fn=count_tokens, inputs=token_count_inputs, outputs=token_info)
+    translate_button.click(
+        fn=translate,
+        inputs=[text, direction, max_new_tokens],
+        outputs=output,
+    )
+    def translate_example(text: str, direction: str) -> str:
+        return translate(text, direction, MAX_NEW_TOKENS_DEFAULT)
+    gr.Examples(
+        label="Short examples",
+        examples=[
+            ["今日はいい天気ですね。", "Japanese → English"],
+            ["東京は世界で最も人口の多い都市の一つです。", "Japanese → English"],
+            ["The cherry blossoms are beautiful this year.", "English → Japanese"],
+            ["Technology is changing how we communicate with each other.", "English → Japanese"],
+        ],
+        inputs=[text, direction],
+        outputs=output,
+        fn=translate_example,
+    )
+    gr.Examples(
+        label="Long examples",
+        examples=[
+            [
+                "近年、大規模言語モデルの発展により、機械翻訳の品質は飛躍的に向上した。"
+                "従来の統計ベースの手法では、文脈を十分に考慮することが難しく、"
+                "長文になるほど翻訳精度が低下する傾向があった。"
+                "しかし、Transformerアーキテクチャの登場以降、"
+                "文全体の意味を捉えた上で自然な訳文を生成することが可能になりつつある。"
+                "特に、日本語と英語のように語順や文法構造が大きく異なる言語対においては、"
+                "この進歩の恩恵は顕著である。"
+                "一方で、専門用語や文化的なニュアンスの翻訳には依然として課題が残されており、"
+                "人間の翻訳者との協働が重要視されている。",
+                "Japanese → English",
+            ],
+            [
+                "The rapid advancement of artificial intelligence has fundamentally transformed "
+                "how software is developed, tested, and deployed. Modern development teams "
+                "increasingly rely on AI-powered tools for code generation, automated testing, "
+                "and even architectural design decisions. While these tools have dramatically "
+                "improved productivity, they also introduce new challenges around code quality, "
+                "security vulnerabilities, and the need for human oversight. The most effective "
+                "approach appears to be a collaborative one, where AI handles repetitive and "
+                "boilerplate tasks while human developers focus on creative problem-solving, "
+                "system design, and ensuring that the generated code aligns with business "
+                "requirements and ethical standards.",
+                "English → Japanese",
+            ],
+        ],
+        inputs=[text, direction],
+        outputs=output,
+        fn=translate_example,
+    )
+if __name__ == "__main__":
+    demo.launch(css_paths="style.css")

pyproject.toml ADDED Viewed

	@@ -0,0 +1,59 @@

+[project]
+name = "cat-translate-7b"
+version = "0.1.0"
+description = "Add your description here"
+readme = "README.md"
+requires-python = ">=3.12"
+dependencies = [
+    "accelerate>=1.12.0",
+    "gradio>=6.8.0",
+    "spaces>=0.47.0",
+    "torch==2.9.1",
+    "transformers>=5.2.0",
+]
+[tool.ruff]
+line-length = 119
+[tool.ruff.lint]
+select = ["ALL"]
+ignore = [
+    "COM812", # missing-trailing-comma
+    "D203",   # one-blank-line-before-class
+    "D213",   # multi-line-summary-second-line
+    "E501",   # line-too-long
+    "SIM117", # multiple-with-statements
+    #
+    "D100",    # undocumented-public-module
+    "D101",    # undocumented-public-class
+    "D102",    # undocumented-public-method
+    "D103",    # undocumented-public-function
+    "D104",    # undocumented-public-package
+    "D105",    # undocumented-magic-method
+    "D107",    # undocumented-public-init
+    "EM101",   # raw-string-in-exception
+    "FBT001",  # boolean-type-hint-positional-argument
+    "FBT002",  # boolean-default-value-positional-argument
+    "ISC001",  # single-line-implicit-string-concatenation
+    "PGH003",  # blanket-type-ignore
+    "PLR0913", # too-many-arguments
+    "PLR0915", # too-many-statements
+    "TRY003",  # raise-vanilla-args
+]
+unfixable = [
+    "F401", # unused-import
+]
+[tool.ruff.lint.pydocstyle]
+convention = "google"
+[tool.ruff.format]
+docstring-code-format = true
+[dependency-groups]
+dev = [
+    "ruff>=0.15.4",
+]
+hf-spaces = [
+    "datasets",
+]

requirements.txt ADDED Viewed

	@@ -0,0 +1,305 @@

+# This file was autogenerated by uv via the following command:
+#    uv export --no-hashes --no-dev --group hf-spaces --no-emit-package typer-slim -o requirements.txt
+accelerate==1.12.0
+    # via cat-translate-7b
+aiofiles==24.1.0
+    # via gradio
+aiohappyeyeballs==2.6.1
+    # via aiohttp
+aiohttp==3.13.3
+    # via fsspec
+aiosignal==1.4.0
+    # via aiohttp
+annotated-doc==0.0.4
+    # via
+    #   fastapi
+    #   typer
+annotated-types==0.7.0
+    # via pydantic
+anyio==4.12.1
+    # via
+    #   gradio
+    #   httpx
+    #   starlette
+attrs==25.4.0
+    # via aiohttp
+audioop-lts==0.2.2 ; python_full_version >= '3.13'
+    # via gradio
+brotli==1.2.0
+    # via gradio
+certifi==2026.2.25
+    # via
+    #   httpcore
+    #   httpx
+    #   requests
+charset-normalizer==3.4.4
+    # via requests
+click==8.3.1
+    # via
+    #   typer
+    #   uvicorn
+colorama==0.4.6 ; sys_platform == 'win32'
+    # via
+    #   click
+    #   tqdm
+datasets==4.6.1
+dill==0.4.0
+    # via
+    #   datasets
+    #   multiprocess
+fastapi==0.135.1
+    # via gradio
+ffmpy==1.0.0
+    # via gradio
+filelock==3.25.0
+    # via
+    #   datasets
+    #   huggingface-hub
+    #   torch
+frozenlist==1.8.0
+    # via
+    #   aiohttp
+    #   aiosignal
+fsspec==2026.2.0
+    # via
+    #   datasets
+    #   gradio-client
+    #   huggingface-hub
+    #   torch
+gradio==6.8.0
+    # via
+    #   cat-translate-7b
+    #   spaces
+gradio-client==2.2.0
+    # via gradio
+groovy==0.1.2
+    # via gradio
+h11==0.16.0
+    # via
+    #   httpcore
+    #   uvicorn
+hf-xet==1.3.2 ; platform_machine == 'AMD64' or platform_machine == 'aarch64' or platform_machine == 'amd64' or platform_machine == 'arm64' or platform_machine == 'x86_64'
+    # via huggingface-hub
+httpcore==1.0.9
+    # via httpx
+httpx==0.28.1
+    # via
+    #   datasets
+    #   gradio
+    #   gradio-client
+    #   huggingface-hub
+    #   safehttpx
+    #   spaces
+huggingface-hub==1.5.0
+    # via
+    #   accelerate
+    #   datasets
+    #   gradio
+    #   gradio-client
+    #   tokenizers
+    #   transformers
+idna==3.11
+    # via
+    #   anyio
+    #   httpx
+    #   requests
+    #   yarl
+jinja2==3.1.6
+    # via
+    #   gradio
+    #   torch
+markdown-it-py==4.0.0
+    # via rich
+markupsafe==3.0.3
+    # via
+    #   gradio
+    #   jinja2
+mdurl==0.1.2
+    # via markdown-it-py
+mpmath==1.3.0
+    # via sympy
+multidict==6.7.1
+    # via
+    #   aiohttp
+    #   yarl
+multiprocess==0.70.18
+    # via datasets
+networkx==3.6.1
+    # via torch
+numpy==2.4.2
+    # via
+    #   accelerate
+    #   datasets
+    #   gradio
+    #   pandas
+    #   transformers
+nvidia-cublas-cu12==12.8.4.1 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via
+    #   nvidia-cudnn-cu12
+    #   nvidia-cusolver-cu12
+    #   torch
+nvidia-cuda-cupti-cu12==12.8.90 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-cuda-nvrtc-cu12==12.8.93 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-cuda-runtime-cu12==12.8.90 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-cudnn-cu12==9.10.2.21 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-cufft-cu12==11.3.3.83 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-cufile-cu12==1.13.1.3 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-curand-cu12==10.3.9.90 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-cusolver-cu12==11.7.3.90 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-cusparse-cu12==12.5.8.93 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via
+    #   nvidia-cusolver-cu12
+    #   torch
+nvidia-cusparselt-cu12==0.7.1 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-nccl-cu12==2.27.5 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-nvjitlink-cu12==12.8.93 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via
+    #   nvidia-cufft-cu12
+    #   nvidia-cusolver-cu12
+    #   nvidia-cusparse-cu12
+    #   torch
+nvidia-nvshmem-cu12==3.3.20 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+nvidia-nvtx-cu12==12.8.90 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+orjson==3.11.7
+    # via gradio
+packaging==26.0
+    # via
+    #   accelerate
+    #   datasets
+    #   gradio
+    #   gradio-client
+    #   huggingface-hub
+    #   spaces
+    #   transformers
+pandas==3.0.1
+    # via
+    #   datasets
+    #   gradio
+pillow==12.1.1
+    # via gradio
+propcache==0.4.1
+    # via
+    #   aiohttp
+    #   yarl
+psutil==5.9.8
+    # via
+    #   accelerate
+    #   spaces
+pyarrow==23.0.1
+    # via datasets
+pydantic==2.12.5
+    # via
+    #   fastapi
+    #   gradio
+    #   spaces
+pydantic-core==2.41.5
+    # via pydantic
+pydub==0.25.1
+    # via gradio
+pygments==2.19.2
+    # via rich
+python-dateutil==2.9.0.post0
+    # via pandas
+python-multipart==0.0.22
+    # via gradio
+pytz==2025.2
+    # via gradio
+pyyaml==6.0.3
+    # via
+    #   accelerate
+    #   datasets
+    #   gradio
+    #   huggingface-hub
+    #   transformers
+regex==2026.2.28
+    # via transformers
+requests==2.32.5
+    # via
+    #   datasets
+    #   spaces
+rich==14.3.3
+    # via typer
+safehttpx==0.1.7
+    # via gradio
+safetensors==0.7.0
+    # via
+    #   accelerate
+    #   transformers
+semantic-version==2.10.0
+    # via gradio
+setuptools==82.0.0
+    # via torch
+shellingham==1.5.4
+    # via typer
+six==1.17.0
+    # via python-dateutil
+spaces==0.47.0
+    # via cat-translate-7b
+starlette==0.52.1
+    # via
+    #   fastapi
+    #   gradio
+sympy==1.14.0
+    # via torch
+tokenizers==0.22.2
+    # via transformers
+tomlkit==0.13.3
+    # via gradio
+torch==2.9.1
+    # via
+    #   accelerate
+    #   cat-translate-7b
+tqdm==4.67.3
+    # via
+    #   datasets
+    #   huggingface-hub
+    #   transformers
+transformers==5.2.0
+    # via cat-translate-7b
+triton==3.5.1 ; platform_machine == 'x86_64' and sys_platform == 'linux'
+    # via torch
+typer==0.24.1
+    # via
+    #   gradio
+    #   huggingface-hub
+    #   typer-slim
+typing-extensions==4.15.0
+    # via
+    #   aiosignal
+    #   anyio
+    #   fastapi
+    #   gradio
+    #   gradio-client
+    #   huggingface-hub
+    #   pydantic
+    #   pydantic-core
+    #   spaces
+    #   starlette
+    #   torch
+    #   typing-inspection
+typing-inspection==0.4.2
+    # via
+    #   fastapi
+    #   pydantic
+tzdata==2025.3 ; sys_platform == 'emscripten' or sys_platform == 'win32'
+    # via pandas
+urllib3==2.6.3
+    # via requests
+uvicorn==0.41.0
+    # via gradio
+xxhash==3.6.0
+    # via datasets
+yarl==1.23.0
+    # via aiohttp

style.css ADDED Viewed

	@@ -0,0 +1,4 @@

+h1 {
+  text-align: center;
+  display: block;
+}

uv.lock ADDED Viewed

The diff for this file is too large to render. See raw diff