Spaces:

Archime
/

canary_aed_streaming

Running on Zero

App Files Community

Archime committed on Nov 19

Commit

f76a38c

1 Parent(s): fc64c8b

add 3 step

Browse files

Files changed (1) hide show

app.py +54 -100

app.py CHANGED Viewed

@@ -4,49 +4,37 @@ from app.logger_config import (
 )
 import numpy as np
 import gradio as gr
-import asyncio
 from fastrtc.webrtc import WebRTC
 from fastrtc.utils import AdditionalOutputs
 from pydub import AudioSegment
-import time
-import os
 from gradio.utils import get_space
 from app.utils import (
-    raise_error,
     READ_SIZE,
     generate_coturn_config,
     read_and_stream_audio,
     stop_streaming,
-    task,
-    task_fake
 )
 from app.session_utils import (
     on_load,
     on_unload,
     get_active_session_hashes,
-    register_session_hash_code,
     reset_all_active_sessions,
-    get_active_task_flag_file,
-    remove_active_task_flag_file
 )
-from app.ui_utils import (
-    SUPPORTED_LANGS_MAP,
-    EXAMPLE_CONFIGS,
-    apply_preset_if_example,
-    reset_to_defaults,
-    summarize_config,
-    handle_additional_outputs,
-    get_custom_theme,
-    on_file_load
-)
-import nemo.collections.asr as nemo_asr
-from app.session_utils import (
-    get_active_task_flag_file,
-    get_session_hashe_chunks_dir
-)
 import spaces
 # --------------------------------------------------------
 # Initialization
@@ -109,43 +97,14 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                             """
                         )
-            btn_proceed_streaming = gr.Button("Proceed to Streaming", visible=False)
-            ui_components_oload_audio = [active_filepath, btn_proceed_streaming]
             main_audio.change(fn=on_file_load, inputs=[main_audio], outputs=ui_components_oload_audio)
-            # main_audio.stop_recording(fn=on_file_load, inputs=[main_audio], outputs=ui_components_one)
-            # main_audio.clear(fn=on_file_load, inputs=[main_audio], outputs=ui_components_one)
-            btn_proceed_streaming.click(lambda: gr.Walkthrough(selected=1), outputs=walkthrough)
         # === STEP 2 ===
-        with gr.Step("Stream", id=1) as audio_stream:
-            gr.Markdown("### Step 2: Start audio streaming")
-            with gr.Group():
-                with gr.Column():
-                    webrtc_stream = WebRTC(
-                        label="Live Stream",
-                        mode="receive",
-                        modality="audio",
-                        rtc_configuration=generate_coturn_config(),
-                        visible=True,
-                        inputs=main_audio,
-                    )
-            start_stream_button = gr.Button("▶️ Start Streaming", variant="primary")
-            webrtc_stream.stream(
-                fn=read_and_stream_audio,
-                inputs=[active_filepath, session_hash_code,gr.State(READ_SIZE)],
-                outputs=[webrtc_stream],
-                trigger=start_stream_button.click,
-                concurrency_id="audio_stream",
-                concurrency_limit=10,
-            )
-            status_message_stream = gr.Markdown("", elem_id="status-message-stream", visible=False)
-            go_to_config = gr.Button("Go to Configuration", visible=False, variant="secondary")
-            go_to_config.click(lambda: gr.Walkthrough(selected=2), outputs=walkthrough)
-        # === STEP 3 ===
-        with gr.Step("Configuration", id=2):
             gr.Markdown("### Step 3: Configure the Task")
             with gr.Group():
                 with gr.Row():
@@ -234,24 +193,49 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
             )
             go_to_task = gr.Button("Go to Task")
-            go_to_task.click(lambda: gr.Walkthrough(selected=3), outputs=walkthrough)
-        # === STEP 4 ===
-        with gr.Step("Task", id=3) as task_step:
-                with gr.Row():
-                    gr.Markdown("## Step 4: Start the Task")
                 with gr.Row():
                     with gr.Column():
                         status_slider = gr.Slider(
                             0, 100,
                             value=0,
-                            label="Streaming Progress",
                             show_label=True,
                             interactive=False,
                             visible=False,
                             show_reset_button=False
                         )
-                        stop_stream_button = gr.Button("⏹️ Stop Streaming", visible=False,variant="stop")
                 with gr.Row():
                     gr.Markdown("---")
                 with gr.Row():
@@ -270,7 +254,7 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                 with gr.Row():
                     status_message_task = gr.Markdown("", elem_id="status-message-task",elem_classes=["info"], visible=False)
                 with gr.Row():
-                    start_task_button = gr.Button("▶️ Start Task", visible=True, variant="primary")
                     stop_task_button = gr.Button("⏹️ Stop Task", visible=False,variant="stop")
                     stop_stream_button.click(
@@ -278,46 +262,16 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                             inputs=[session_hash_code],
                         )
-                    def stop_task_fn(session_hash_code):
-                        remove_active_task_flag_file(session_hash_code)
-                        yield "Task stopped by user."
                     stop_task_button.click(
                         fn=stop_task_fn,
                         inputs=session_hash_code,
-                            outputs=task_output
                         )
-                            # task(session_hash_code)
                     config_task_ui = [session_hash_code,task_type, lang_source, lang_target,
                             chunk_secs, left_context_secs, right_context_secs,
                             streaming_policy, alignatt_thr, waitk_lagging,
                             exclude_sink_frames, xatt_scores_layer, hallucinations_detector]
-                    def start_task_asr_ast(
-                            session_hash_code,
-                            task_type, lang_source, lang_target,
-                            chunk_secs, left_context_secs, right_context_secs,
-                            streaming_policy, alignatt_thr, waitk_lagging,
-                            exclude_sink_frames, xatt_scores_layer, hallucinations_detector
-                                   ):
-                        """Stream transcription or translation results in real time."""
-                        accumulated = ""
-                        # Boucle sur le générateur de `task2()`
-                        for result, status, current_chunk in task(
-                            session_hash_code,
-                            task_type, lang_source, lang_target,
-                            chunk_secs, left_context_secs, right_context_secs,
-                            streaming_policy, alignatt_thr, waitk_lagging,
-                            exclude_sink_frames, xatt_scores_layer, hallucinations_detector
-                            ):
-                            if status == "success":
-                                yield accumulated + result, gr.update(visible=True,value=current_chunk , elem_classes=["info"]), gr.update(visible=False), gr.update(visible=True)
-                                accumulated += result
-                            elif status in ["warning","info" ]:
-                                yield accumulated, gr.update(visible=True,value=result , elem_classes=[status]), gr.update(visible=False), gr.update(visible=True)
-                            elif status in ["error", "done"]:
-                                yield accumulated, gr.update(visible=True,value=result , elem_classes=[status]), gr.update(visible=True), gr.update(visible=False)
                     start_task_button.click(
@@ -330,11 +284,11 @@ with gr.Blocks(theme=theme, css=css_style) as demo:
                                 exclude_sink_frames, xatt_scores_layer, hallucinations_detector
                             ],
-                            outputs=[task_output,status_message_task,start_task_button,stop_task_button]
                     )
                     ui_components = [
-                        start_stream_button, stop_stream_button,
                         go_to_config, audio_source_step, status_slider,walkthrough,status_message_stream
                     ]

 )
 import numpy as np
 import gradio as gr
 from fastrtc.webrtc import WebRTC
 from fastrtc.utils import AdditionalOutputs
 from pydub import AudioSegment
 from gradio.utils import get_space
+from app.supported_languages import (
+    SUPPORTED_LANGS_MAP,
+)
+from app.ui_utils import (
+    EXAMPLE_CONFIGS,
+    apply_preset_if_example,
+    reset_to_defaults,
+    summarize_config,
+    handle_additional_outputs,
+    get_custom_theme,
+    on_file_load,
+    start_task_asr_ast,
+    stop_task_fn
+)
 from app.utils import (
     READ_SIZE,
     generate_coturn_config,
     read_and_stream_audio,
     stop_streaming,
 )
 from app.session_utils import (
     on_load,
     on_unload,
     get_active_session_hashes,
     reset_all_active_sessions,
 )
 import spaces
 # --------------------------------------------------------
 # Initialization
                             """
                         )
+            go_to_config = gr.Button("Go to Configuration", visible=False)
+            ui_components_oload_audio = [active_filepath, go_to_config]
             main_audio.change(fn=on_file_load, inputs=[main_audio], outputs=ui_components_oload_audio)
+            go_to_config.click(lambda: gr.Walkthrough(selected=1), outputs=walkthrough)
         # === STEP 2 ===
+        with gr.Step("Configuration", id=1)as config_step:
             gr.Markdown("### Step 3: Configure the Task")
             with gr.Group():
                 with gr.Row():
             )
             go_to_task = gr.Button("Go to Task")
+            go_to_task.click(lambda: gr.Walkthrough(selected=2), outputs=walkthrough)
+        # === STEP 3 ===
+        with gr.Step("Task", id=2) as task_step:
                 with gr.Row():
+                    gr.Markdown("## Step 4: Start Stream Task")
+                with gr.Group():
                     with gr.Column():
+                        webrtc_stream = WebRTC(
+                            label="Live Stream",
+                            mode="receive",
+                            modality="audio",
+                            rtc_configuration=generate_coturn_config(),
+                            visible=True,
+                            inputs=main_audio,
+                            icon= "https://cdn-icons-png.flaticon.com/128/18429/18429788.png",
+                            pulse_color= "#df7a7a",
+                            icon_radius= "10px",
+                            icon_button_color= "rgb(255, 255, 255)",
+                            height=150,
+                            show_label=False
+                        )
                         status_slider = gr.Slider(
                             0, 100,
                             value=0,
+                            label="Streaming Progress %",
                             show_label=True,
                             interactive=False,
                             visible=False,
                             show_reset_button=False
                         )
+                start_stream_button = gr.Button("▶️ Start Streaming", variant="primary")
+                stop_stream_button = gr.Button("⏹️ Stop Streaming", visible=False,variant="stop")
+                webrtc_stream.stream(
+                    fn=read_and_stream_audio,
+                    inputs=[active_filepath, session_hash_code,gr.State(READ_SIZE)],
+                    outputs=[webrtc_stream],
+                    trigger=start_stream_button.click,
+                    concurrency_id="audio_stream",
+                    concurrency_limit=10,
+                )
+                status_message_stream = gr.Markdown("", elem_id="status-message-stream", visible=False)
                 with gr.Row():
                     gr.Markdown("---")
                 with gr.Row():
                 with gr.Row():
                     status_message_task = gr.Markdown("", elem_id="status-message-task",elem_classes=["info"], visible=False)
                 with gr.Row():
+                    start_task_button = gr.Button("▶️ Start Task", visible=False, variant="primary")
                     stop_task_button = gr.Button("⏹️ Stop Task", visible=False,variant="stop")
                     stop_stream_button.click(
                             inputs=[session_hash_code],
                         )
                     stop_task_button.click(
                         fn=stop_task_fn,
                         inputs=session_hash_code,
+                        outputs=task_output
                         )
                     config_task_ui = [session_hash_code,task_type, lang_source, lang_target,
                             chunk_secs, left_context_secs, right_context_secs,
                             streaming_policy, alignatt_thr, waitk_lagging,
                             exclude_sink_frames, xatt_scores_layer, hallucinations_detector]
                     start_task_button.click(
                                 exclude_sink_frames, xatt_scores_layer, hallucinations_detector
                             ],
+                            outputs=[task_output,status_message_task,start_task_button,stop_task_button,config_step]
                     )
                     ui_components = [
+                        start_stream_button, stop_stream_button,start_task_button,
                         go_to_config, audio_source_step, status_slider,walkthrough,status_message_stream
                     ]