Spaces:

hysts
/

kyutai-stt-2.6b-en

Running on Zero

App Files Community

hysts (HF Staff) committed 10 days ago

Commit

1e9d7e6

1 Parent(s): d020ce8

Fix

Browse files

Files changed (1) hide show

app.py +17 -72

app.py CHANGED Viewed

@@ -31,7 +31,7 @@ def transcribe(audio_path: str) -> str:
     """
     if not audio_path:
         return ""
     data, _ = librosa.load(audio_path, sr=SAMPLE_RATE)
     if len(data) > MAX_SAMPLE_SIZE:
         data = data[:MAX_SAMPLE_SIZE]
@@ -52,7 +52,7 @@ custom_theme = gr.themes.Soft(
     font=gr.themes.GoogleFont("Inter"),
     text_size="lg",
     spacing_size="md",
-    radius_size="lg"
 ).set(
     button_primary_background_fill="*primary_600",
     button_primary_background_fill_hover="*primary_700",
@@ -197,32 +197,24 @@ with gr.Blocks(fill_height=False) as demo:
             <p class="header-subtitle">Advanced English Audio Transcription powered by AI</p>
         </div>
     """)
     # Info banner
     gr.HTML(f"""
         <div class="info-banner">
             ℹ️ Upload or record audio in English (max {MAX_DURATION} seconds). Supports WAV, MP3, and other common formats.
         </div>
     """)
     # Main content
     with gr.Group(elem_classes="main-card"):
         # Audio input
         audio = gr.Audio(
-            label="🎵 Audio Input",
-            type="filepath",
-            sources=["upload", "microphone"],
-            elem_classes="audio-container"
         )
         # Transcribe button
-        transcribe_btn = gr.Button(
-            "✨ Transcribe Audio",
-            variant="primary",
-            size="lg",
-            elem_classes="primary-button"
-        )
         # Output
         output = gr.Textbox(
             label="📝 Transcription",
@@ -230,9 +222,9 @@ with gr.Blocks(fill_height=False) as demo:
             lines=6,
             max_lines=12,
             show_copy_button=True,
-            elem_classes="transcription-output"
         )
     # Examples section
     with gr.Group(elem_classes="examples-container"):
         gr.Markdown("### 💡 Try These Examples")
@@ -244,7 +236,7 @@ with gr.Blocks(fill_height=False) as demo:
             cache_examples=True,
             examples_per_page=5,
         )
     # Footer
     gr.HTML("""
         <div class="footer-container">
@@ -254,22 +246,12 @@ with gr.Blocks(fill_height=False) as demo:
             </p>
         </div>
     """)
     # Event handlers
-    transcribe_btn.click(
-        fn=transcribe,
-        inputs=audio,
-        outputs=output,
-        api_name="transcribe"
-    )
     # Auto-transcribe on audio upload (optional - remove if you prefer manual triggering)
-    audio.change(
-        fn=transcribe,
-        inputs=audio,
-        outputs=output,
-        show_progress="minimal"
-    )
 if __name__ == "__main__":
@@ -278,44 +260,7 @@ if __name__ == "__main__":
         css=custom_css,
         footer_links=[
             {"label": "Built with anycoder", "url": "https://huggingface.co/spaces/akhaliq/anycoder"},
-            {"label": "Model", "url": "https://huggingface.co/kyutai/stt-2.6b-en-trfs"}
         ],
-        mcp_server=True
     )
----
-## ✨ Key Improvements
-### 🎨 Modern Design
-- **Gradient header** with clean typography
-- **Card-based layout** for better visual hierarchy
-- **Soft theme** with custom blue/purple gradient accent colors
-- **Professional spacing** and rounded corners
-### 📱 Mobile-First
-- **Responsive design** that adapts to all screen sizes
-- **Optimized padding** and font sizes for mobile
-- **Touch-friendly** button sizes
-- **Max-width container** for better readability on large screens
-### 🚀 UX Enhancements
-- **Info banner** explaining max duration and supported formats
-- **Auto-transcribe** on audio upload (optional)
-- **Copy button** on transcription output
-- **Visual feedback** with hover effects on buttons
-- **Clear visual hierarchy** with icons and labels
-### 🎯 Minimal & Clean
-- **Removed unnecessary Row/Column** nesting
-- **Streamlined components** - only what's needed
-- **Better grouping** with semantic sections
-- **Professional footer** with proper attribution
-### 🔧 Technical
-- **Gradio 6 compliant** - all parameters in correct locations
-- **Custom theme** with Soft base and gradient accents
-- **Mobile-optimized CSS** with media queries
-- **Proper error handling** with empty audio check
-The redesign maintains all functionality while providing a modern, professional, mobile-friendly interface! 🎉

     """
     if not audio_path:
         return ""
     data, _ = librosa.load(audio_path, sr=SAMPLE_RATE)
     if len(data) > MAX_SAMPLE_SIZE:
         data = data[:MAX_SAMPLE_SIZE]
     font=gr.themes.GoogleFont("Inter"),
     text_size="lg",
     spacing_size="md",
+    radius_size="lg",
 ).set(
     button_primary_background_fill="*primary_600",
     button_primary_background_fill_hover="*primary_700",
             <p class="header-subtitle">Advanced English Audio Transcription powered by AI</p>
         </div>
     """)
     # Info banner
     gr.HTML(f"""
         <div class="info-banner">
             ℹ️ Upload or record audio in English (max {MAX_DURATION} seconds). Supports WAV, MP3, and other common formats.
         </div>
     """)
     # Main content
     with gr.Group(elem_classes="main-card"):
         # Audio input
         audio = gr.Audio(
+            label="🎵 Audio Input", type="filepath", sources=["upload", "microphone"], elem_classes="audio-container"
         )
         # Transcribe button
+        transcribe_btn = gr.Button("✨ Transcribe Audio", variant="primary", size="lg", elem_classes="primary-button")
         # Output
         output = gr.Textbox(
             label="📝 Transcription",
             lines=6,
             max_lines=12,
             show_copy_button=True,
+            elem_classes="transcription-output",
         )
     # Examples section
     with gr.Group(elem_classes="examples-container"):
         gr.Markdown("### 💡 Try These Examples")
             cache_examples=True,
             examples_per_page=5,
         )
     # Footer
     gr.HTML("""
         <div class="footer-container">
             </p>
         </div>
     """)
     # Event handlers
+    transcribe_btn.click(fn=transcribe, inputs=audio, outputs=output, api_name="transcribe")
     # Auto-transcribe on audio upload (optional - remove if you prefer manual triggering)
+    audio.change(fn=transcribe, inputs=audio, outputs=output, show_progress="minimal")
 if __name__ == "__main__":
         css=custom_css,
         footer_links=[
             {"label": "Built with anycoder", "url": "https://huggingface.co/spaces/akhaliq/anycoder"},
+            {"label": "Model", "url": "https://huggingface.co/kyutai/stt-2.6b-en-trfs"},
         ],
+        mcp_server=True,
     )