Spaces:

Fanny1366
/

assignment

Sleeping

Fanny1366 committed on Mar 9

Commit

90d9abf

verified ·

1 Parent(s): 7f4f62a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -14,15 +14,15 @@ def img2text(url):
 # text2story
 def text2story(text):
-    story_pipeline = pipeline("text-generation", model="facebook/opt-125m")
-    # Call the pipeline to generate the story text from the given prompt
     result = story_pipeline(text, max_length=200, num_return_sequences=1)
     story_text = result[0]['generated_text']  # text of the single requested sequence
     return story_text
 # text2audio
 def text2audio(story_text):
-    # Use the gTTS library to convert the text to audio
     tts = gTTS(text=story_text, lang='en')
     # Create an in-memory byte stream to hold the audio data
     audio_file = io.BytesIO()
@@ -30,7 +30,7 @@ def text2audio(story_text):
     tts.write_to_fp(audio_file)
     # Move the stream position back to the start so the data can be read afterwards
     audio_file.seek(0)
-    return audio_file
 # main part
 st.set_page_config(page_title="Your Image to Audio Story",
@@ -63,4 +63,7 @@ if uploaded_file is not None:
     # Play button
     if st.button("Play Audio"):
-        st.audio(audio_data, format="audio/mpeg")

 # text2story
 def text2story(text):
+    # Generate the story with a Hugging Face text-generation pipeline.  NOTE(review): the pipeline is built inside the function, so it is set up again on every call - consider creating it once
+    story_pipeline = pipeline("text-generation", model="agentica-org/DeepScaleR-1.5B-Preview")
     result = story_pipeline(text, max_length=200, num_return_sequences=1)
     story_text = result[0]['generated_text']  # text of the single requested sequence
     return story_text
 # text2audio
 def text2audio(story_text):
+    # Use gTTS to convert the text to audio
     tts = gTTS(text=story_text, lang='en')
     # Create an in-memory byte stream to hold the audio data
     audio_file = io.BytesIO()
     tts.write_to_fp(audio_file)
     # Move the stream position back to the start so the data can be read afterwards
     audio_file.seek(0)
+    return {'audio': audio_file, 'sampling_rate': 16000}  # Return the audio buffer and a sampling rate.  NOTE(review): 16000 is a hard-coded literal, not read from the generated audio - confirm it matches what gTTS writes
 # main part
 st.set_page_config(page_title="Your Image to Audio Story",
     # Play button
     if st.button("Play Audio"):
+        st.audio(audio_data['audio'],
+                 format="audio/wav",
+                 start_time=0,
+                 sample_rate=audio_data['sampling_rate'])