Natthathida committed on
Commit
7be5d5e
·
verified ·
1 Parent(s): 79d2f90

delete comment

Browse files
Files changed (1) hide show
  1. app.py +0 -43
app.py CHANGED
@@ -1,46 +1,3 @@
1
- # from transformers import pipeline, BlipForConditionalGeneration, BlipProcessor, AutoTokenizer, AutoModelForSeq2SeqLM
2
- # import torchaudio
3
- # from torchaudio.transforms import Resample
4
- # import torch
5
- # from flask import Flask, request, jsonify
6
- # # from PLI import Image
7
- # # import pytesseract
8
- # # import gradio as gr
9
-
10
- # app = Flask(__name__)
11
-
12
- # # Initialize TTS model from Hugging Face
13
- # tts_model_name = "suno/bark"
14
- # tts = pipeline(task="text-to-speech", model=tts_model_name)
15
-
16
- # # Initialize Blip model for image captioning
17
- # model_id = "dblasko/blip-dalle3-img2prompt"
18
- # blip_model = BlipForConditionalGeneration.from_pretrained(model_id)
19
- # blip_processor = BlipProcessor.from_pretrained(model_id)
20
-
21
- # @app.route('/generate_caption_and_audio', methods=['POST'])
22
- # def generate_caption ():
23
- # try:
24
- # # Get image file from the request
25
- # image = request.files['image']
26
-
27
- # # Generate caption from image using Blip model
28
- # inputs = blip_processor(images=image, return_tensors="pt")
29
- # pixel_values = inputs.pixel_values
30
- # generated_ids = blip_model.generate(pixel_values=pixel_values, max_length=50)
31
- # generated_caption = blip_processor.batch_decode(generated_ids, skip_special_tokens=True, temperature=0.8, top_k=40, top_p=0.9)[0]
32
-
33
- # # Use TTS model to convert generated caption to audio
34
- # audio_output = tts(generated_caption)
35
- # audio_path = "generated_audio_resampled.wav"
36
- # torchaudio.save(audio_path, torch.tensor(audio_output[0]), audio_output["sampling_rate"])
37
-
38
- # return jsonify({'generate_caption': generate_caption, 'audio_path': audio_path})
39
- # except Exception as e:
40
- # return jsonify({'error': str(e)})
41
-
42
- # if __name__ == '__main__':
43
- # app.run(debug=True)
44
  from flask import Flask, request, jsonify
45
  from transformers import pipeline, BlipForConditionalGeneration, BlipProcessor
46
  import torchaudio
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  from flask import Flask, request, jsonify
2
  from transformers import pipeline, BlipForConditionalGeneration, BlipProcessor
3
  import torchaudio