Spaces:

WJ88
/

Parakeet-TDT-v3-ASR-Demo_Real-Time_Mic-File_Transcription

Runtime error

App Files Community

WJ88 committed on Oct 18, 2025

Commit

d8eb8af

verified ·

1 Parent(s): 65c1721

i hate ui v5657

Browse files

Files changed (1) hide show

app.py +27 -23

app.py CHANGED Viewed

@@ -291,13 +291,35 @@ with gr.Blocks(title="Parakeet-TDT v3 (Unified MALSD Beam)") as demo:
     # Header
     gr.Markdown("### RELEASE: GIGA-CHAD-v.0.7")
     # Interactive Tabs
     with gr.Tab("Mic"):
         # Live audio input and output components
         mic = gr.Audio(
             sources=["microphone"], type="numpy", streaming=True, label="Speak"
         )
-        text_out = gr.Textbox(label="Transcript", lines=8)
         flush_btn = gr.Button("Flush")
         # Session state for maintaining context across streams
@@ -319,8 +341,9 @@ with gr.Blocks(title="Parakeet-TDT v3 (Unified MALSD Beam)") as demo:
         results_table = gr.Dataframe(
             headers=["file", "text"],
             label="Results",
-            row_count=(0, "dynamic"),
             col_count=(2, "fixed"),
         )
         # Event: Process uploaded files and update table
         run_btn.click(files_run, inputs=[files], outputs=[results_table])
@@ -393,27 +416,6 @@ with gr.Blocks(title="Parakeet-TDT v3 (Unified MALSD Beam)") as demo:
     )
     gr.HTML(highlights_html)
-    # Features Table (Static Data)
-    features_data = [
-        ["Model Setup", "Loads Parakeet-TDT-0.6b-v3 (RNNT-based) with MALSD "
-         "decoding for beam exploration and loop labels for alignments."],
-        ["Audio Handling", "Resamples to 16kHz mono, supports various formats."],
-        ["Streaming (Mic)", "Partial hypotheses for seamless updates, "
-         "session-based for multi-chunk context."],
-        ["UI", "Gradio tabs—Mic for live input/output (flush to finalize), "
-         "Files for batch results table."],
-        ["Tech Stack", "NeMo (ASR core), Gradio (web UI), Torchaudio/Soundfile "
-         "(audio utils)."],
-    ]
-    gr.Dataframe(
-        value=features_data,
-        headers=["Feature", "Description"],
-        datatype=["text", "text"],
-        row_count=(len(features_data), "fixed"),
-        col_count=(2, "fixed"),
-        interactive=False,
-    )
     # TODO Section
     todo_html = (
         "<h3>TODO:</h3>"
@@ -426,4 +428,6 @@ with gr.Blocks(title="Parakeet-TDT v3 (Unified MALSD Beam)") as demo:
     )
     gr.HTML(todo_html)
 demo.queue().launch(ssr_mode=False)

     # Header
     gr.Markdown("### RELEASE: GIGA-CHAD-v.0.7")
+    # Features Table (Static Data) - Moved here for prominence after title
+    features_data = [
+        ["Model Setup", "Loads Parakeet-TDT-0.6b-v3 (RNNT-based) with MALSD "
+         "decoding for beam exploration and loop labels for alignments."],
+        ["Audio Handling", "Resamples to 16kHz mono, supports various formats."],
+        ["Streaming (Mic)", "Partial hypotheses for seamless updates, "
+         "session-based for multi-chunk context."],
+        ["UI", "Gradio tabs—Mic for live input/output (flush to finalize), "
+         "Files for batch results table."],
+        ["Tech Stack", "NeMo (ASR core), Gradio (web UI), Torchaudio/Soundfile "
+         "(audio utils)."],
+    ]
+    gr.Dataframe(
+        value=features_data,
+        headers=["Feature", "Description"],
+        datatype=["text", "text"],
+        row_count=(len(features_data), "fixed"),
+        col_count=(2, "fixed"),
+        interactive=False,
+        wrap=True,  # Ensures text wraps for better visibility in cells
+    )
     # Interactive Tabs
     with gr.Tab("Mic"):
         # Live audio input and output components
         mic = gr.Audio(
             sources=["microphone"], type="numpy", streaming=True, label="Speak"
         )
+        text_out = gr.Textbox(label="Transcript", lines=4)  # Reduced height for visibility
         flush_btn = gr.Button("Flush")
         # Session state for maintaining context across streams
         results_table = gr.Dataframe(
             headers=["file", "text"],
             label="Results",
+            row_count=(5, "dynamic"),  # Limited initial rows for smaller window
             col_count=(2, "fixed"),
+            wrap=True,  # Text wraps to keep visible without horizontal scroll
         )
         # Event: Process uploaded files and update table
         run_btn.click(files_run, inputs=[files], outputs=[results_table])
     )
     gr.HTML(highlights_html)
     # TODO Section
     todo_html = (
         "<h3>TODO:</h3>"
     )
     gr.HTML(todo_html)
+# Launch Configuration
+# Note: ssr_mode=False disables server-side rendering for better real-time streaming performance.
 demo.queue().launch(ssr_mode=False)