Commit ·
f74ac89
1
Parent(s): ad3e6b2
Update demo
Browse files
- app.py +15 -0
- requirements.txt +2 -0
app.py
CHANGED
|
@@ -128,6 +128,20 @@ HERO_BADGES = f"""
|
|
| 128 |
</div>
|
| 129 |
</div>
|
| 130 |
"""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 131 |
APP_CSS = """
|
| 132 |
:root {
|
| 133 |
--font-sans: ui-sans-serif, system-ui, sans-serif,
|
|
@@ -534,6 +548,7 @@ with gr.Blocks(css=APP_CSS, theme=gr.themes.Soft(primary_hue="teal", secondary_h
|
|
| 534 |
</div>
|
| 535 |
"""
|
| 536 |
)
|
|
|
|
| 537 |
|
| 538 |
with gr.Tabs(elem_classes="tab-nav"):
|
| 539 |
with gr.Row(elem_classes="panel-row"):
|
|
|
|
| 128 |
</div>
|
| 129 |
</div>
|
| 130 |
"""
|
| 131 |
+
MODEL_GUIDE = """
|
| 132 |
+
### This Model Is Best For
|
| 133 |
+
|
| 134 |
+
- Standard audio QA and instruction following across speech, sound, and music
|
| 135 |
+
- Assistant-style long-audio understanding with direct answers and follow-up chat
|
| 136 |
+
- Speech tasks such as ASR, paralinguistic understanding, and multilingual AST / speech translation
|
| 137 |
+
- Broad music captioning and audio description when you want an answer rather than a dense caption
|
| 138 |
+
|
| 139 |
+
If you need the most detailed long-form captions or timestamp-heavy scene breakdowns, use
|
| 140 |
+
[Audio Flamingo Next Captioner](https://huggingface.co/spaces/nvidia/audio-flamingo-next-captioner).
|
| 141 |
+
|
| 142 |
+
If you need explicit step-by-step timestamp-grounded reasoning traces, use
|
| 143 |
+
[Audio Flamingo Next Think](https://huggingface.co/spaces/nvidia/audio-flamingo-next-think).
|
| 144 |
+
"""
|
| 145 |
APP_CSS = """
|
| 146 |
:root {
|
| 147 |
--font-sans: ui-sans-serif, system-ui, sans-serif,
|
|
|
|
| 548 |
</div>
|
| 549 |
"""
|
| 550 |
)
|
| 551 |
+
gr.Markdown(MODEL_GUIDE)
|
| 552 |
|
| 553 |
with gr.Tabs(elem_classes="tab-nav"):
|
| 554 |
with gr.Row(elem_classes="panel-row"):
|
requirements.txt
CHANGED
|
@@ -1,3 +1,5 @@
|
|
|
|
|
|
|
|
| 1 |
git+https://github.com/lashahub/transformers.git@add_AudioFlamingoNext
|
| 2 |
|
| 3 |
accelerate
|
|
|
|
| 1 |
+
# Pinned demo environment. AF-Next is supported in Transformers; this
|
| 2 |
+
# branch matches the exact build used by the Space.
|
| 3 |
git+https://github.com/lashahub/transformers.git@add_AudioFlamingoNext
|
| 4 |
|
| 5 |
accelerate
|