Spaces:

vola2004
/

age-gender-app

Build error

App Files Files Community

vola2004 committed on Oct 24, 2025

Commit

0dc3843

verified ·

1 Parent(s): 7562781

Upload 8 files

Browse files

Files changed (4) hide show

Dockerfile +11 -13
README_hf.md +43 -0
app_docker.py +114 -0
requirements_hf.txt +11 -0

Dockerfile CHANGED Viewed

@@ -1,27 +1,25 @@
 FROM python:3.9-slim
-# システムの依存関係をインストール（エラーハンドリング付き）
-RUN apt-get update && \
-    apt-get install -y --no-install-recommends \
     build-essential \
     curl \
     git \
-    && apt-get clean \
-    && rm -rf /var/lib/apt/lists/* \
-    || echo "Warning: Some packages may not have installed correctly"
-# 作業ディレクトリを設定
 WORKDIR /app
 # Pythonの依存関係をインストール
-COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
-# アプリケーションのコードをコピー
 COPY . .
-# ポート5000を公開
-EXPOSE 5000
-# アプリケーションを起動
-CMD ["python", "app.py"]

 FROM python:3.9-slim
+# Install the system packages needed to build and fetch Python dependencies.
+# software-properties-common is deliberately not installed: it is not
+# available on newer Debian bases used by python:3.9-slim, which makes
+# apt-get fail, and nothing in this image uses it.
+RUN apt-get update && apt-get install -y --no-install-recommends \
     build-essential \
     curl \
     git \
+    && rm -rf /var/lib/apt/lists/*
+# Set the working directory
 WORKDIR /app
 # Install the Python dependencies
+COPY requirements_hf.txt requirements.txt
 RUN pip install --no-cache-dir -r requirements.txt
+# Copy the application files
 COPY . .
+# Expose the port served by the app
+EXPOSE 7860
+# Start the application
+CMD ["python", "app_docker.py"]

README_hf.md ADDED Viewed

	@@ -0,0 +1,43 @@

+---
+title: 年代・性別推定システム
+emoji: 🧠
+colorFrom: blue
+colorTo: purple
+sdk: docker
+pinned: false
+license: mit
+app_port: 7860
+---
+# 年代・性別推定システム
+日本語テキストから年代と性別を推定するAIシステムです。BERTベースのモデルを使用して、入力されたテキストの特徴から年代（10代〜60代）と性別（男性・女性）を確率で予測します。
+## 機能
+- **年代推定**: 10代、20代、30代、40代、50代、60代の6つの年代を確率で予測
+- **性別推定**: 男性・女性を確率で予測
+- **リアルタイム予測**: Webアプリケーションでリアルタイムに予測結果を表示
+## 技術仕様
+- **ベースモデル**: cl-tohoku/bert-large-japanese
+- **フレームワーク**: PyTorch, Transformers, Gradio
+- **デプロイ**: Docker on Hugging Face Spaces
+## 使用方法
+1. テキストボックスに日本語のテキストを入力
+2. 「推測実行」ボタンをクリック
+3. 年代と性別の確率が表示されます
+## モデル詳細
+- **年代モデル**: 各年代を独立した二値分類器として学習
+- **性別モデル**: 2クラス分類（男性・女性）
+- **学習データ**: 日本語テキストデータセット
+- **精度**: 年代推定 約79%、性別推定 約70%
+## ライセンス
+MIT License

app_docker.py ADDED Viewed

	@@ -0,0 +1,114 @@

+import gradio as gr
+import torch
+import os
+import gzip
+import shutil
+from predictor import load_models, predict_text
+def extract_compressed_models():
+    """圧縮されたモデルファイルを展開"""
+    try:
+        print("=== 圧縮モデルファイルの展開 ===")
+        # 圧縮ファイルを展開
+        compressed_files = [
+            ("bert_age_model.bin.gz", "bert_age_model.bin"),
+            ("bert_gender_model.bin.gz", "bert_gender_model.bin")
+        ]
+        for compressed_file, extracted_file in compressed_files:
+            if os.path.exists(compressed_file) and not os.path.exists(extracted_file):
+                print(f"📦 {compressed_file} を展開中...")
+                with gzip.open(compressed_file, 'rb') as f_in:
+                    with open(extracted_file, 'wb') as f_out:
+                        shutil.copyfileobj(f_in, f_out)
+                print(f"✅ {extracted_file} の展開が完了しました")
+            elif os.path.exists(extracted_file):
+                print(f"✅ {extracted_file} は既に存在します")
+            else:
+                print(f"❌ {compressed_file} が見つかりません")
+        return True
+    except Exception as e:
+        print(f"❌ 展開エラー: {e}")
+        return False
+def predict_age_gender(text):
+    """年代・性別予測関数"""
+    if not text.strip():
+        return "テキストを入力してください。", "", ""
+    try:
+        result = predict_text(text)
+        # 年代予測結果を整形
+        age_results = []
+        for age, percentage in result['age_percentages'].items():
+            age_results.append(f"{age}: {percentage}%")
+        age_text = "\n".join(age_results)
+        # 性別予測結果を整形
+        gender_results = []
+        for gender, percentage in result['gender_percentages'].items():
+            gender_results.append(f"{gender}: {percentage}%")
+        gender_text = "\n".join(gender_results)
+        # 最も高い確率の年代を特定
+        max_age = max(result['age_percentages'].items(), key=lambda x: x[1])
+        max_gender = max(result['gender_percentages'].items(), key=lambda x: x[1])
+        summary = f"推定結果: {max_age[0]} ({max_age[1]}%), {max_gender[0]} ({max_gender[1]}%)"
+        return summary, age_text, gender_text
+    except Exception as e:
+        return f"エラーが発生しました: {str(e)}", "", ""
+# Extract and load the models
+print("=== アプリケーション初期化 ===")
+# Extract the compressed files
+if extract_compressed_models():
+    # Load the models
+    print("=== モデル読み込み開始 ===")
+    try:
+        load_models()
+        print("✅ モデルの読み込みが完了しました")
+    except Exception as e:
+        print(f"❌ モデルの読み込みに失敗しました: {e}")
+        print("⚠️  モデルファイルが存在しない可能性があります")
+else:
+    print("❌ モデルの展開に失敗しました")
+# Gradio interface
+interface = gr.Interface(
+    fn=predict_age_gender,
+    inputs=gr.Textbox(
+        label="日本語テキストを入力してください",
+        placeholder="例: 今日はとても良い天気ですね。友達と一緒に散歩をしました。",
+        lines=3
+    ),
+    outputs=[
+        gr.Textbox(label="推定結果サマリー"),
+        gr.Textbox(label="年代予測詳細"),
+        gr.Textbox(label="性別予測詳細")
+    ],
+    title="🧠 年代・性別推定システム",
+    description="日本語テキストから年代と性別を推定するAIシステムです。",
+    examples=[
+        "今日はとても良い天気ですね。",
+        "友達と一緒に散歩をしました。",
+        "新しいスマートフォンを買いました。",
+        "仕事が忙しくて疲れました。"
+    ],
+    theme=gr.themes.Soft()
+)
+# Launch the application
+if __name__ == "__main__":
+    interface.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        share=False  # False on Hugging Face Spaces
+    )

requirements_hf.txt ADDED Viewed

	@@ -0,0 +1,11 @@

+gradio>=4.0.0
+torch>=1.9.0
+transformers>=4.21.0
+pandas>=1.3.0
+scikit-learn>=1.0.0
+numpy>=1.21.0
+fugashi>=1.2.0
+ipadic>=1.0.0
+sudachipy>=0.6.0
+sudachidict-core>=20240101
+neologdn>=0.0.0