Spaces:

Fanny1366
/

assignment

Sleeping

Fanny1366 committed on Mar 9

Commit

3fceda9

verified ·

1 Parent(s): 7b4668d

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,7 +2,7 @@
 import streamlit as st
 from transformers import pipeline
 from gtts import gTTS
-import os
 # function part
 # img2text
@@ -14,15 +14,19 @@ def img2text(url):
 # text2story
 def text2story(text):
-    story_text = pipeline("text-generation", model="perplexity-ai/r1-1776", trust_remote_code=True)  # to be completed
     return story_text
 # text2audio
 def text2audio(story_text):
-    # Convert text to audio using gTTS
-    tts = gTTS(story_text, lang="en")
-    audio_file = "story_audio.wav"
-    tts.save(audio_file)
     return audio_file
 # main part
@@ -55,12 +59,10 @@ if uploaded_file is not None:
     #Stage 3: Story to Audio data
     st.text('Generating audio data...')
-    audio_data =text2audio(story)
     # Play button
     if st.button("Play Audio"):
-        st.audio(audio_data['audio'],
                     format="audio/wav",
-                    start_time=0,
-                    sample_rate = audio_data['sampling_rate'])
-        st.audio("kids_playing_audio.wav")

 import streamlit as st
 from transformers import pipeline
 from gtts import gTTS
+import io
 # function part
 # img2text
 # text2story
 def text2story(text):
+    story_pipeline = pipeline("text-generation", model="perplexity-ai/r1-1776", trust_remote_code=True)
+    story_text = story_pipeline(text, max_length=200)[0]['generated_text']
     return story_text
 # text2audio
 def text2audio(story_text):
+    # 使用 gTTS 将文本转换为音频
+    tts = gTTS(text=story_text, lang='en')
+    # 创建一个内存中的字节流
+    audio_file = io.BytesIO()
+    # 将音频保存到字节流中
+    tts.write_to_fp(audio_file)
+    audio_file.seek(0)
     return audio_file
 # main part
     #Stage 3: Story to Audio data
     st.text('Generating audio data...')
+    audio_data = text2audio(story)
     # Play button
     if st.button("Play Audio"):
+        st.audio(audio_data,
                     format="audio/wav",
+                    start_time=0)