SandraCLV committed on
Commit
9853375
1 Parent(s): 76f44e6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +21 -17
app.py CHANGED
@@ -1,22 +1,26 @@
1
  import gradio as gr
2
- from transformers import pipeline
3
- import speech_recognition as sr
 
 
4
 
5
- def transcribe_speech():
6
- r = sr.Recognizer()
 
 
7
 
8
- # Record Audio
9
- with sr.Microphone() as source:
10
- print("Habla ahora:")
11
- audio = r.listen(source)
 
12
 
13
- # Speech recognition using Google Speech Recognition
14
- try:
15
- text = r.recognize_google(audio, language='es-ES')
16
- print("Creo que dijiste: " + text)
17
- except sr.UnknownValueError:
18
- print("Google Speech Recognition no pudo entender el audio")
19
- except sr.RequestError as e:
20
- print("No se pudo solicitar resultados del servicio de Google Speech Recognition; {0}".format(e))
21
 
22
- transcribe_speech()
 
 
 
1
  import gradio as gr
2
+ from PIL import Image
3
+ import pytesseract
4
+ from gtts import gTTS
5
+ import os
6
 
7
+ # Función para convertir imagen a texto
8
+ def image_to_text(imagen):
9
+ texto = pytesseract.image_to_string(Image.open(imagen))
10
+ return texto
11
 
12
+ # Función para convertir texto a audio
13
+ def text_to_audio(texto):
14
+ audio = gTTS(text=texto, lang='es', slow=False)
15
+ audio.save("audio.mp3")
16
+ return "audio.mp3"
17
 
18
+ # Función que combina las dos funciones anteriores
19
+ def imagen_a_audio(imagen):
20
+ texto = image_to_text(imagen)
21
+ audio = text_to_audio(texto)
22
+ return audio
 
 
 
23
 
24
+ # Crear la interfaz de usuario con Gradio
25
+ iface = gr.Interface(fn=imagen_a_audio, inputs="Image", outputs="Audio")
26
+ iface.launch()