czhaobt commited on
Commit
dadddbe
·
verified ·
1 Parent(s): da278ae

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +36 -55
app.py CHANGED
@@ -1,47 +1,29 @@
1
  import streamlit as st
2
  from transformers import pipeline
3
  from gtts import gTTS
4
- import io
5
  import os
6
 
7
  # function part
8
  # img2text
9
  def img2text(url):
10
- try:
11
- image_to_text_model = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")
12
- text = image_to_text_model(url)[0]["generated_text"]
13
- return text
14
- except Exception as e:
15
- st.error(f"图像转文本出错: {e}")
16
- return None
17
 
18
  # text2story
19
  def text2story(text):
20
- try:
21
- story_generator = pipeline("text-generation", model="Qwen/QwQ-32B-Preview")
22
- # 生成故事文本
23
- result = story_generator(text, max_length=200, num_return_sequences=1)
24
- story = result[0]['generated_text']
25
- return story
26
- except Exception as e:
27
- st.error(f"文本生成故事出错: {e}")
28
- return None
29
 
30
  # text2audio
31
  def text2audio(story_text):
32
- try:
33
- # 创建 gTTS 对象,将文本转换为语音
34
- tts = gTTS(text=story_text, lang='en')
35
- # 创建字节流对象用于存储音频数据
36
- audio_file = io.BytesIO()
37
- # 将音频数据写入字节流
38
- tts.write_to_fp(audio_file)
39
- # 移动文件指针到开头
40
- audio_file.seek(0)
41
- return audio_file
42
- except Exception as e:
43
- st.error(f"文本转音频出错: {e}")
44
- return None
45
 
46
  st.set_page_config(page_title="Your Image to Audio Story",
47
  page_icon="🦜")
@@ -49,35 +31,34 @@ st.header("Turn Your Image to Audio Story")
49
  uploaded_file = st.file_uploader("Select an Image...")
50
 
51
  if uploaded_file is not None:
52
- # 使用临时文件存储上传的图像
53
- temp_file_path = "temp_image.jpg"
54
  bytes_data = uploaded_file.getvalue()
55
- with open(temp_file_path, "wb") as file:
56
  file.write(bytes_data)
 
 
57
 
58
- # 显示上传的图像,使用 use_container_width 避免弃用警告
59
- st.image(uploaded_file, caption="Uploaded Image", use_container_width=True)
60
-
61
- # Stage 1: Image to Text
62
  st.text('Processing img2text...')
63
- scenario = img2text(temp_file_path)
64
- if scenario:
65
- st.write(scenario)
66
 
67
- # Stage 2: Text to Story
68
- st.text('Generating a story...')
69
- story = text2story(scenario)
70
- if story:
71
- st.write(story)
72
 
73
- # Stage 3: Story to Audio data
74
- st.text('Generating audio data...')
75
- audio_data = text2audio(story)
76
- if audio_data:
77
- # Play button
78
- if st.button("Play Audio"):
79
- st.audio(audio_data, format="audio/mpeg", start_time=0)
80
 
81
- # 删除临时文件
82
- if os.path.exists(temp_file_path):
83
- os.remove(temp_file_path)
 
 
 
 
 
 
 
 
1
  import streamlit as st
2
  from transformers import pipeline
3
  from gtts import gTTS
 
4
  import os
5
 
6
  # function part
7
  # img2text
8
  def img2text(url):
9
+ image_to_text_model = pipeline("image-to-text", model="Salesforce/blip-image-captioning-base")
10
+ text = image_to_text_model(url)[0]["generated_text"]
11
+ return text
 
 
 
 
12
 
13
  # text2story
14
  def text2story(text):
15
+ story_generator = pipeline("text-generation", model="agentica-org/DeepScaleR-1.5B-Preview")
16
+ story = story_generator(text, max_length=200, num_return_sequences=1)[0]['generated_text']
17
+ return story
 
 
 
 
 
 
18
 
19
  # text2audio
20
  def text2audio(story_text):
21
+ # 创建 gTTS 对象
22
+ tts = gTTS(text=story_text, lang='en')
23
+ # 保存音频文件
24
+ audio_file = "story_audio.wav"
25
+ tts.save(audio_file)
26
+ return audio_file
 
 
 
 
 
 
 
27
 
28
  st.set_page_config(page_title="Your Image to Audio Story",
29
  page_icon="🦜")
 
31
  uploaded_file = st.file_uploader("Select an Image...")
32
 
33
  if uploaded_file is not None:
34
+ print(uploaded_file)
 
35
  bytes_data = uploaded_file.getvalue()
36
+ with open(uploaded_file.name, "wb") as file:
37
  file.write(bytes_data)
38
+ st.image(uploaded_file, caption="Uploaded Image",
39
+ use_column_width=True)
40
 
41
+ #Stage 1: Image to Text
 
 
 
42
  st.text('Processing img2text...')
43
+ scenario = img2text(uploaded_file.name)
44
+ st.write(scenario)
 
45
 
46
+ #Stage 2: Text to Story
47
+ st.text('Generating a story...')
48
+ story = text2story(scenario)
49
+ st.write(story)
 
50
 
51
+ #Stage 3: Story to Audio data
52
+ st.text('Generating audio data...')
53
+ audio_file = text2audio(story)
 
 
 
 
54
 
55
+ # Play button
56
+ if st.button("Play Audio"):
57
+ with open(audio_file, "rb") as audio:
58
+ audio_bytes = audio.read()
59
+ st.audio(audio_bytes,
60
+ format="audio/wav",
61
+ start_time=0)
62
+ # 删除临时音频文件
63
+ if os.path.exists(audio_file):
64
+ os.remove(audio_file)