documentaitestv3

Sleeping

App Files Community

danegergo committed on Apr 1

Commit

e4de5ab

1 Parent(s): 0adaf09

fixed shared transcript issue

Browse files

Files changed (1) hide show

app.py +5 -6

app.py CHANGED Viewed

@@ -31,7 +31,6 @@ WEBSOCKET_HEADERS = {
     "OpenAI-Beta": "realtime=v1"
 }
-transcription = ""
 css = """
 """
@@ -45,6 +44,7 @@ class WebSocketClient:
         self.queue = asyncio.Queue(maxsize=10)
         self.loop = None
         self.client_id = client_id
     async def connect(self):
         try:
@@ -66,15 +66,14 @@ class WebSocketClient:
         self.loop.run_until_complete(self.connect())
     def process_websocket_message(self, message: Data):
-        global transcription
         message_object = json.loads(message)
         if message_object["type"] != "error":
             print(f"{LogColors.OK}Received message: {LogColors.ENDC} {message}")
             if message_object["type"] == "conversation.item.input_audio_transcription.delta":
                 delta = message_object["delta"]
-                transcription += delta
             elif message_object["type"] == "conversation.item.input_audio_transcription.completed":
-                transcription += ' ' if len(transcription) and transcription[-1] != ' ' else ''
         else:
             print(f"{LogColors.ERROR}Error: {message}{LogColors.ENDC}")
@@ -130,7 +129,7 @@ def send_audio_chunk(new_chunk: gr.Audio, client_id: str):
         return "Connection is being established, please try again in a few seconds."
     sr, y = new_chunk
     connections[client_id].enqueue_audio_chunk(sr, y)
-    return transcription
 def create_new_websocket_connection():
     client_id = str(uuid.uuid4())
@@ -143,7 +142,7 @@ if __name__ == "__main__":
         gr.Markdown(f"# Realtime transcription demo")
         with gr.Row():
             with gr.Column():
-                output_textbox = gr.Textbox(label="Transcription", value="", lines=7, interactive=False, autoscroll=True)
         with gr.Row():
             with gr.Column(scale=5):
                 audio_input = gr.Audio(streaming=True, format="wav")

     "OpenAI-Beta": "realtime=v1"
 }
 css = """
 """
         self.queue = asyncio.Queue(maxsize=10)
         self.loop = None
         self.client_id = client_id
+        self.transcript = ""
     async def connect(self):
         try:
         self.loop.run_until_complete(self.connect())
     def process_websocket_message(self, message: Data):
         message_object = json.loads(message)
         if message_object["type"] != "error":
             print(f"{LogColors.OK}Received message: {LogColors.ENDC} {message}")
             if message_object["type"] == "conversation.item.input_audio_transcription.delta":
                 delta = message_object["delta"]
+                self.transcript += delta
             elif message_object["type"] == "conversation.item.input_audio_transcription.completed":
+                self.transcript += ' ' if len(self.transcript) and self.transcript[-1] != ' ' else ''
         else:
             print(f"{LogColors.ERROR}Error: {message}{LogColors.ENDC}")
         return "Connection is being established, please try again in a few seconds."
     sr, y = new_chunk
     connections[client_id].enqueue_audio_chunk(sr, y)
+    return connections[client_id].transcript
 def create_new_websocket_connection():
     client_id = str(uuid.uuid4())
         gr.Markdown(f"# Realtime transcription demo")
         with gr.Row():
             with gr.Column():
+                output_textbox = gr.Textbox(label="Transcript", value="", lines=7, interactive=False, autoscroll=True)
         with gr.Row():
             with gr.Column(scale=5):
                 audio_input = gr.Audio(streaming=True, format="wav")