Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -3,17 +3,17 @@ from transformers import AutoProcessor, BlipForConditionalGeneration, AutoTokeni
|
|
3 |
import librosa
|
4 |
import numpy as np
|
5 |
import torch
|
6 |
-
import image_text_model
|
7 |
-
import audio_model
|
8 |
import open_clip
|
9 |
|
10 |
#CONSTANTS
|
11 |
|
12 |
def generate_captions_speech(image):
|
13 |
|
14 |
-
caption_blip_large = generate_caption(blip_processor_large, blip_model_large, image)
|
15 |
print('generate_captions>>>'+caption_blip_large)
|
16 |
-
return caption_blip_large,text_to_speech(caption_blip_large,"Surprise Me!")
|
17 |
|
18 |
|
19 |
# Define la interfaz de usuario utilizando Gradio entradas y salidas
|
|
|
3 |
import librosa
|
4 |
import numpy as np
|
5 |
import torch
|
6 |
+
import image_text_model as itm
|
7 |
+
import audio_model as am
|
8 |
import open_clip
|
9 |
|
10 |
#CONSTANTS
|
11 |
|
12 |
def generate_captions_speech(image):
|
13 |
|
14 |
+
caption_blip_large = itm.generate_caption(blip_processor_large, blip_model_large, image)
|
15 |
print('generate_captions>>>'+caption_blip_large)
|
16 |
+
return caption_blip_large,am.text_to_speech(caption_blip_large,"Surprise Me!")
|
17 |
|
18 |
|
19 |
# Define la interfaz de usuario utilizando Gradio entradas y salidas
|