Spaces:

Archime
/

canary_aed_streaming

Running on Zero

App Files Community

Archime committed on Nov 18

Commit

799a0f6

1 Parent(s): 935d736

rename some functions

Browse files

Files changed (4) hide show

app.py +17 -72
app/session_utils.py +3 -3
app/streaming_audio_processor.py +3 -4
app/utils.py +8 -12

app.py CHANGED Viewed

@@ -13,7 +13,7 @@ import os
 from gradio.utils import get_space
 from app.utils import (
-    raise_function,
     READ_SIZE,
     generate_coturn_config,
     read_and_stream_audio,
@@ -24,9 +24,9 @@ from app.utils import (
 from app.session_utils import (
     on_load,
     on_unload,
-    get_active_session_hash_code,
     register_session_hash_code,
-    reset_all_active_session_hash_code,
     get_active_task_flag_file,
     remove_active_task_flag_file
@@ -45,39 +45,29 @@ from app.ui_utils import (
 import nemo.collections.asr as nemo_asr
 from app.session_utils import (
     get_active_task_flag_file,
-    get_folder_chunks
 )
 import spaces
 # --------------------------------------------------------
 # Initialization
 # --------------------------------------------------------
-reset_all_active_session_hash_code()
 theme,css_style = get_custom_theme()
-# logger.info(f'Hydra config: {OmegaConf.to_yaml(cfg)}')
-from app.streaming_audio_processor import StreamingAudioProcessorConfig
-# asr_model = None
 with gr.Blocks(theme=theme, css=css_style) as demo:
     session_hash_code = gr.State()
-    session_hash_code_box = gr.Textbox(label="Session ID", interactive=False, visible=DEBUG)
-    with gr.Accordion("📊 Active Sessions Hash", open=True ,visible=DEBUG):
-        sessions_table = gr.DataFrame(
-            headers=["session_hash_code", "file", "start_time", "status"],
-            interactive=False,
-            wrap=True,
-            max_height=200,
-        )
-        gr.Timer(3.0).tick(fn=get_active_session_hash_code, outputs=sessions_table)
     demo.load(fn=on_load, inputs=None, outputs=[session_hash_code, session_hash_code_box])
     demo.unload(fn=on_unload)
@@ -303,28 +293,8 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                             chunk_secs, left_context_secs, right_context_secs,
                             streaming_policy, alignatt_thr, waitk_lagging,
                             exclude_sink_frames, xatt_scores_layer, hallucinations_detector]
-                    def start_transcription(
-                        session_hash_code,
-                        task_type, lang_source, lang_target,
-                        chunk_secs, left_context_secs, right_context_secs,
-                        streaming_policy, alignatt_thr, waitk_lagging,
-                        exclude_sink_frames, xatt_scores_layer, hallucinations_detector
-                        ):
-                        """Stream transcription or translation results in real time."""
-                        accumulated = ""
-                        yield f"Starting {task_type.lower()}...\n\n",gr.update(visible=False),gr.update(visible=True)
-                        # Boucle sur le générateur de `task()`
-                        for msg in task(session_hash_code,config_task_ui):
-                            accumulated += msg
-                            yield accumulated,gr.update(visible=False),gr.update(visible=True)
-                        yield accumulated + "\nDone.",gr.update(visible=True),gr.update(visible=False)
-                    def start_task(
                             session_hash_code,
                             task_type, lang_source, lang_target,
                             chunk_secs, left_context_secs, right_context_secs,
@@ -351,7 +321,7 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                     start_task_button.click(
-                            fn=start_task,
                             inputs=[
                                 session_hash_code,
                                 task_type, lang_source, lang_target,
@@ -363,18 +333,6 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                             outputs=[task_output,status_message_task,start_task_button,stop_task_button]
                     )
-                        # start_task_button.click(
-                        #     fn=start_task,
-                        #     inputs=[
-                        #         session_hash_code,
-                        #         task_type, lang_source, lang_target,
-                        #         chunk_secs, left_context_secs, right_context_secs,
-                        #         streaming_policy, alignatt_thr, waitk_lagging,
-                        #         exclude_sink_frames, xatt_scores_layer, hallucinations_detector
-                        #     ],
-                        #     outputs=[task_output,status_message_task,start_task_button,stop_task_button]
-                        # )
                     ui_components = [
                         start_stream_button, stop_stream_button,
                         go_to_config, audio_source_step, status_slider,walkthrough,status_message_stream
@@ -388,19 +346,6 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                         concurrency_limit=10,
                     )
-                        # def toggle_task_buttons():
-                        #     return (
-                        #         gr.update(visible=False),
-                        #         gr.update(visible=True),
-                        #         gr.update(visible=True)
-                        #     )
-                        # start_task_button.click(
-                        #     fn=toggle_task_buttons,
-                        #     inputs=None,
-                        #     outputs=[start_task_button, stop_task_button, stop_stream_button],
-                        #     queue=False
-                        # )
 if __name__ == "__main__":

 from gradio.utils import get_space
 from app.utils import (
+    raise_error,
     READ_SIZE,
     generate_coturn_config,
     read_and_stream_audio,
 from app.session_utils import (
     on_load,
     on_unload,
+    get_active_session_hashes,
     register_session_hash_code,
+    reset_all_active_sessions,
     get_active_task_flag_file,
     remove_active_task_flag_file
 import nemo.collections.asr as nemo_asr
 from app.session_utils import (
     get_active_task_flag_file,
+    get_session_hashe_chunks_dir
 )
 import spaces
 # --------------------------------------------------------
 # Initialization
 # --------------------------------------------------------
+reset_all_active_sessions()
 theme,css_style = get_custom_theme()
 with gr.Blocks(theme=theme, css=css_style) as demo:
     session_hash_code = gr.State()
+    with gr.Accordion("DEGUG PANEL", open=False, visible=DEBUG):
+        session_hash_code_box = gr.Textbox(label="Session ID", interactive=False, visible=DEBUG)
+        with gr.Accordion("📊 Active Sessions Hash", open=True ,visible=DEBUG):
+            sessions_table = gr.DataFrame(
+                headers=["session_hash_code", "file", "start_time", "status"],
+                interactive=False,
+                wrap=True,
+                max_height=200,
+            )
+            gr.Timer(3.0).tick(fn=get_active_session_hashes, outputs=sessions_table)
     demo.load(fn=on_load, inputs=None, outputs=[session_hash_code, session_hash_code_box])
     demo.unload(fn=on_unload)
                             chunk_secs, left_context_secs, right_context_secs,
                             streaming_policy, alignatt_thr, waitk_lagging,
                             exclude_sink_frames, xatt_scores_layer, hallucinations_detector]
+                    def start_task_asr_ast(
                             session_hash_code,
                             task_type, lang_source, lang_target,
                             chunk_secs, left_context_secs, right_context_secs,
                     start_task_button.click(
+                            fn=start_task_asr_ast,
                             inputs=[
                                 session_hash_code,
                                 task_type, lang_source, lang_target,
                             outputs=[task_output,status_message_task,start_task_button,stop_task_button]
                     )
                     ui_components = [
                         start_stream_button, stop_stream_button,
                         go_to_config, audio_source_step, status_slider,walkthrough,status_message_stream
                         concurrency_limit=10,
                     )
 if __name__ == "__main__":

app/session_utils.py CHANGED Viewed

@@ -79,7 +79,7 @@ def ensure_tmp_dir():
         logging.error(f"Failed to create tmp directory {TMP_DIR}: {e}")
-def reset_all_active_session_hash_code():
     """Removes all temporary session_hash_code files and folders at startup."""
     ensure_tmp_dir()
@@ -210,7 +210,7 @@ def unregister_session_hash_code_hash(session_hash_code: str):
         logging.error(f"[{session_hash_code}] Error unregistering session_hash_code: {e}")
-def get_active_session_hash_code():
     """Returns active session_hash_codes as a list of rows for the DataFrame."""
     if not os.path.exists(ACTIVE_SESSIONS_HASH_FILE):
         return []
@@ -259,5 +259,5 @@ def remove_active_task_flag_file(session_hash_code: str):
         except Exception as e:
             logging.warning(f"[{session_hash_code}] Failed to remove file {fname}: {e}")
-def get_folder_chunks(session_hash_code: str):
      return os.path.join(TMP_DIR, f"{NAME_FOLDER_CHUNKS}{session_hash_code}")

         logging.error(f"Failed to create tmp directory {TMP_DIR}: {e}")
+def reset_all_active_sessions():
     """Removes all temporary session_hash_code files and folders at startup."""
     ensure_tmp_dir()
         logging.error(f"[{session_hash_code}] Error unregistering session_hash_code: {e}")
+def get_active_session_hashes():
     """Returns active session_hash_codes as a list of rows for the DataFrame."""
     if not os.path.exists(ACTIVE_SESSIONS_HASH_FILE):
         return []
         except Exception as e:
             logging.warning(f"[{session_hash_code}] Failed to remove file {fname}: {e}")
+def get_session_hashe_chunks_dir(session_hash_code: str):
      return os.path.join(TMP_DIR, f"{NAME_FOLDER_CHUNKS}{session_hash_code}")

app/streaming_audio_processor.py CHANGED Viewed

@@ -171,8 +171,7 @@ class StreamingAudioProcessor:
         Flushes anything remaining in the buffer.
         """
         logging.info("Finalizing stream. Flushing final buffer...")
-        final_text = self._flush_and_reset()
-        if final_text:
-            logging.info(f"Received final flushed text: '{final_text}'")
-        return final_text

         Flushes anything remaining in the buffer.
         """
         logging.info("Finalizing stream. Flushing final buffer...")
+        for reset_text in  self._flush_and_reset() :
+            logging.info(f"Received final flushed text: '{reset_text}'")
+            yield reset_text

app/utils.py CHANGED Viewed

@@ -19,7 +19,7 @@ from app.session_utils import (
     get_active_stream_flag_file,
     remove_active_stream_flag_file,
     remove_active_task_flag_file,
-    get_folder_chunks
 )
 from app.ui_utils import (
     SUPPORTED_LANGS_MAP
@@ -105,7 +105,7 @@ def read_and_stream_audio(filepath_to_stream: str, session_hash_code: str,read_s
             time.sleep(chunk_duration_ms/1000)
             #  Save only if transcription is active
             if os.path.exists(task_active_flag) :
-                chunk_dir = get_folder_chunks(session_hash_code)
                 if not os.path.exists(chunk_dir) :
                     os.makedirs(chunk_dir, exist_ok=True)
                 npz_path = os.path.join(chunk_dir, f"chunk_{i:05d}.npz")
@@ -114,7 +114,7 @@ def read_and_stream_audio(filepath_to_stream: str, session_hash_code: str,read_s
                     np.savez_compressed(npz_path, data=chunk_array, rate=frame_rate)
                     logging.debug(f"[{session_hash_code}] Saved chunk {i}/{total_chunks} (transcribe active) ({progress}%) ({npz_path}).")
-            # raise_function()  # Optional injected test exception
         logging.info(f"[{session_hash_code}] Audio streaming completed successfully.")
@@ -166,7 +166,7 @@ def task_fake(session_hash_code: str,
     active_flag = get_active_task_flag_file(session_hash_code)
     with open(active_flag, "w") as f:
         f.write("1")
-    chunk_dir = get_folder_chunks(session_hash_code)
     logging.info(f"[{session_hash_code}] task started. {chunk_dir}")
     try:
@@ -268,7 +268,7 @@ def task(session_hash_code: str,
     active_flag = get_active_task_flag_file(session_hash_code)
     with open(active_flag, "w") as f:
         f.write("1")
-    chunk_dir = get_folder_chunks(session_hash_code)
     logging.info(f"[{session_hash_code}] task started. {chunk_dir}")
     try:
@@ -308,8 +308,8 @@ def task(session_hash_code: str,
                 time.sleep(0.1)
         # TODO
-        # final_text = streamer.finalize_stream()
-        # yield (text, "success", final_text)
         # if final_text:
         #     print(final_text, end='', flush=True)
         # yield f"\n{final_text}"
@@ -392,7 +392,7 @@ def _is_stop_requested(session_hash_code) -> bool:
-def raise_function():
     """Raise an error randomly (1 out of 10 times)."""
     if random.randint(1, 10) == 1:
         raise RuntimeError("Random failure triggered!")
@@ -447,7 +447,3 @@ def get_current_device():
-def raise_function():
-    """Raise an error randomly (1 out of 10 times)."""
-    if random.randint(1, 50) == 1:
-        raise RuntimeError("Random failure triggered!")

     get_active_stream_flag_file,
     remove_active_stream_flag_file,
     remove_active_task_flag_file,
+    get_session_hashe_chunks_dir
 )
 from app.ui_utils import (
     SUPPORTED_LANGS_MAP
             time.sleep(chunk_duration_ms/1000)
             #  Save only if transcription is active
             if os.path.exists(task_active_flag) :
+                chunk_dir = get_session_hashe_chunks_dir(session_hash_code)
                 if not os.path.exists(chunk_dir) :
                     os.makedirs(chunk_dir, exist_ok=True)
                 npz_path = os.path.join(chunk_dir, f"chunk_{i:05d}.npz")
                     np.savez_compressed(npz_path, data=chunk_array, rate=frame_rate)
                     logging.debug(f"[{session_hash_code}] Saved chunk {i}/{total_chunks} (transcribe active) ({progress}%) ({npz_path}).")
+            # raise_error()  # Optional injected test exception
         logging.info(f"[{session_hash_code}] Audio streaming completed successfully.")
     active_flag = get_active_task_flag_file(session_hash_code)
     with open(active_flag, "w") as f:
         f.write("1")
+    chunk_dir = get_session_hashe_chunks_dir(session_hash_code)
     logging.info(f"[{session_hash_code}] task started. {chunk_dir}")
     try:
     active_flag = get_active_task_flag_file(session_hash_code)
     with open(active_flag, "w") as f:
         f.write("1")
+    chunk_dir = get_session_hashe_chunks_dir(session_hash_code)
     logging.info(f"[{session_hash_code}] task started. {chunk_dir}")
     try:
                 time.sleep(0.1)
         # TODO
+        for final_text in streamer.finalize_stream() :
+            yield (text, "success", final_text)
         # if final_text:
         #     print(final_text, end='', flush=True)
         # yield f"\n{final_text}"
+def raise_error():
     """Raise an error randomly (1 out of 10 times)."""
     if random.randint(1, 10) == 1:
         raise RuntimeError("Random failure triggered!")