Spaces:

Archime
/

canary_aed_streaming

Running on Zero

App Files Files Community

Archime committed on Nov 14

Commit

010aaff

1 Parent(s): 11c4a5a

adjust task for spaces.GPU

Browse files

Files changed (2) hide show

app.py +78 -2
app/utils.py +0 -70

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ from app.utils import (
     generate_coturn_config,
     read_and_stream_audio,
     stop_streaming,
-    task
 )
 from app.session_utils import (
     on_load,
@@ -40,6 +40,11 @@ from app.ui_utils import (
     on_file_load
 )
 import nemo.collections.asr as nemo_asr
 # --------------------------------------------------------
 # Initialization
 # --------------------------------------------------------
@@ -63,6 +68,77 @@ streaming_audio_processor_config = StreamingAudioProcessorConfig(
     silence_threshold_chunks=1
 )
 streamer = StreamingAudioProcessor(speech_engine=canary_speech_engine,vad_engine=silero_vad_engine,cfg=streaming_audio_processor_config)
 with gr.Blocks(theme=theme, css=css_style) as demo:
@@ -291,7 +367,7 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                         yield f"Starting {task_type.lower()}...\n\n",gr.update(visible=False),gr.update(visible=True)
                         # Boucle sur le générateur de `task()`
-                        for msg in task(session_hash_code,streamer=streamer):
                             accumulated += msg
                             yield accumulated,gr.update(visible=False),gr.update(visible=True)

     generate_coturn_config,
     read_and_stream_audio,
     stop_streaming,
+    # task
 )
 from app.session_utils import (
     on_load,
     on_file_load
 )
 import nemo.collections.asr as nemo_asr
+from app.session_utils import (
+    get_active_task_flag_file,
+    get_folder_chunks
+)
+import spaces
 # --------------------------------------------------------
 # Initialization
 # --------------------------------------------------------
     silence_threshold_chunks=1
 )
 streamer = StreamingAudioProcessor(speech_engine=canary_speech_engine,vad_engine=silero_vad_engine,cfg=streaming_audio_processor_config)
+@spaces.GPU
+def task(session_id: str):
+    """Stream transcription text for a session while its task flag file exists.
+
+    Creates the session's active-task flag file, then polls the session's
+    chunk directory for ``.npz`` files. Each chunk is loaded, handed to the
+    module-level ``streamer`` and deleted once processed. The loop runs until
+    the flag file disappears (it is removed by code outside this function),
+    after which the stream is finalized and the flag file and the empty chunk
+    directory are cleaned up.
+
+    Args:
+        session_id: Identifier used to resolve the flag file and chunk folder.
+
+    Yields:
+        str: Status messages, transcribed text fragments and error messages,
+        in the order they are produced.
+    """
+    active_flag = get_active_task_flag_file(session_id)
+    with open(active_flag, "w") as f:
+        f.write("1")
+    chunk_dir = get_folder_chunks(session_id)
+    logging.info(f"[{session_id}] task started. {chunk_dir}")
+    # Cleanup failures are recorded here and reported after the ``finally``
+    # block, because yielding inside ``finally`` breaks generator close().
+    cleanup_error = None
+    try:
+        logging.info(f"[{session_id}] task loop started.")
+        yield f"Task started for session {session_id}\n\n"
+        while os.path.exists(active_flag):
+            if not os.path.exists(chunk_dir):
+                logging.warning(f"[{session_id}] No chunk directory found for task.")
+                yield "No audio chunks yet... waiting for stream.\n"
+                time.sleep(0.1)
+                continue
+            # Sorted so chunks are processed in filename order.
+            files = sorted(f for f in os.listdir(chunk_dir) if f.endswith(".npz"))
+            if not files:
+                time.sleep(0.1)
+                continue
+            for fname in files:
+                fpath = os.path.join(chunk_dir, fname)
+                try:
+                    # Close the archive before deleting the file so the
+                    # handle is not leaked (and removal works on platforms
+                    # that refuse to delete open files).
+                    with np.load(fpath) as npz:
+                        samples = npz["data"]
+                        rate = int(npz["rate"])
+                    logging.debug(
+                        f"[{session_id}] Processing {fname}: {len(samples)} samples @ {rate}Hz"
+                    )
+                    new_texts = streamer.process_chunk(samples)
+                    for text in new_texts:
+                        print(text, end='', flush=True)
+                        yield f"{text}"
+                        logging.debug(f"[{session_id}] {new_texts}")
+                    os.remove(fpath)
+                    logging.debug(f"[{session_id}] Deleted processed chunk: {fname}")
+                except Exception as e:
+                    # NOTE(review): a failing chunk is left on disk and will be
+                    # retried on the next poll - confirm this is intended.
+                    logging.error(f"[{session_id}] Error processing {fname}: {e}")
+                    yield f"Error processing {fname}: {e}\n"
+                    continue
+            time.sleep(0.1)
+        final_text = streamer.finalize_stream()
+        if final_text:
+            print(final_text, end='', flush=True)
+            yield f"\n{final_text}"
+        else:
+            # Avoid emitting the literal "None" when nothing is left to flush.
+            yield "\n"
+        logging.info(f"[{session_id}] task loop ended (flag removed).")
+    except Exception as e:
+        logging.error(f"[{session_id}] task error: {e}", exc_info=True)
+        yield f"Unexpected error: {e}\n"
+    finally:
+        # No ``yield`` in this block: when the consumer closes the generator
+        # early, a yield here raises "generator ignored GeneratorExit".
+        if os.path.exists(active_flag):
+            os.remove(active_flag)
+        logging.info(f"[{session_id}] task stopped.")
+        try:
+            if os.path.exists(chunk_dir) and not os.listdir(chunk_dir):
+                os.rmdir(chunk_dir)
+                logging.debug(f"[{session_id}] Cleaned up empty chunk dir.")
+        except Exception as e:
+            logging.error(f"[{session_id}] Cleanup error: {e}")
+            cleanup_error = e
+        logging.info(f"[{session_id}] Exiting task loop.")
+    # Reached only on a normal finish, never while the generator is being closed.
+    if cleanup_error is not None:
+        yield f"\nCleanup error: {cleanup_error}"
+    yield "\nTask finished and cleaned up.\n"
 with gr.Blocks(theme=theme, css=css_style) as demo:
                         yield f"Starting {task_type.lower()}...\n\n",gr.update(visible=False),gr.update(visible=True)
                         # Boucle sur le générateur de `task()`
+                        for msg in task(session_hash_code):
                             accumulated += msg
                             yield accumulated,gr.update(visible=False),gr.update(visible=True)

app/utils.py CHANGED Viewed

@@ -156,78 +156,8 @@ else:
 # --- Audio Stream Function ---
-@spaces.GPU
-def task(session_id: str, streamer:  StreamingAudioProcessor):
-    """Continuously read and delete .npz chunks while task is active."""
-    active_flag = get_active_task_flag_file(session_id)
-    with open(active_flag, "w") as f:
-        f.write("1")
-    chunk_dir = get_folder_chunks(session_id)
-    logging.info(f"[{session_id}] task started. {chunk_dir}")
-    try:
-        logging.info(f"[{session_id}] task loop started.")
-        yield f"Task started for session {session_id}\n\n"
-        while os.path.exists(active_flag):
-            if not os.path.exists(chunk_dir):
-                logging.warning(f"[{session_id}] No chunk directory found for task.")
-                yield "No audio chunks yet... waiting for stream.\n"
-                time.sleep(0.1)
-                continue
-            files = sorted(f for f in os.listdir(chunk_dir) if f.endswith(".npz"))
-            if not files:
-                time.sleep(0.1)
-                continue
-            for fname in files:
-                fpath = os.path.join(chunk_dir, fname)
-                try:
-                    npz = np.load(fpath)
-                    samples = npz["data"]
-                    rate = int(npz["rate"])
-                    text = f"Transcribed {fname}: {len(samples)} samples @ {rate}Hz"
-                    new_texts = streamer.process_chunk(samples)
-                    for text in new_texts:
-                        print(text, end='', flush=True)
-                        yield f"{text}"
-                        logging.debug(f"[{session_id}] {new_texts}")
-                    # yield f"{text}\n"
-                    os.remove(fpath)
-                    logging.debug(f"[{session_id}] Deleted processed chunk: {fname}")
-                except Exception as e:
-                    logging.error(f"[{session_id}] Error processing {fname}: {e}")
-                    yield f"Error processing {fname}: {e}\n"
-                    continue
-            time.sleep(0.1)
-            # raise_function()
-        final_text = streamer.finalize_stream()
-        if final_text:
-            print(final_text, end='', flush=True)
-        yield f"\n{final_text}"
-        # yield f"\n"
-        logging.info(f"[{session_id}] task loop ended (flag removed).")
-    except Exception as e:
-        logging.error(f"[{session_id}] task error: {e}", exc_info=True)
-        yield f"Unexpected error: {e}\n"
-    finally:
-        # active_flag = os.path.join(TMP_DIR, f"transcribe_active_{session_id}.txt")
-        if os.path.exists(active_flag):
-            os.remove(active_flag)
-        logging.info(f"[{session_id}] task stopped.")
-        try:
-            if os.path.exists(chunk_dir) and not os.listdir(chunk_dir):
-                os.rmdir(chunk_dir)
-                logging.debug(f"[{session_id}] Cleaned up empty chunk dir.")
-        except Exception as e:
-            logging.error(f"[{session_id}] Cleanup error: {e}")
-            yield "\nCleanup error: {e}"
-        logging.info(f"[{session_id}] Exiting task loop.")
-        yield "\nTask finished and cleaned up.\n"


156
157
158	# --- Audio Stream Function ---








159
160






























































161
162
163