Spaces:

Dragneel
/

TinyLlama

Sleeping

Drag2121 committed on Sep 17, 2024

Commit

4e963c4

1 Parent(s): 0af890e

stream word

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,4 +1,5 @@
 import os
 from fastapi import FastAPI, HTTPException
 from fastapi.responses import StreamingResponse
 from pydantic import BaseModel
@@ -44,9 +45,20 @@ async def ask_question_stream(question: Question):
         async def generate():
             full_response = ""
             async for chunk in llm.astream(question.text):
-                full_response += chunk
-                yield chunk
             # Log the full response after streaming is complete
             logger.info(f"Full streamed response: {full_response}")

 import os
+import re
 from fastapi import FastAPI, HTTPException
 from fastapi.responses import StreamingResponse
 from pydantic import BaseModel
         async def generate():
             full_response = ""
+            buffer = ""
             async for chunk in llm.astream(question.text):
+                buffer += chunk
+                words = re.findall(r'\S+|\s+', buffer)
+                for word in words[:-1]:
+                    full_response += word
+                    yield word
+                buffer = words[-1] if words else ""
+            if buffer:
+                full_response += buffer
+                yield buffer
             # Log the full response after streaming is complete
             logger.info(f"Full streamed response: {full_response}")