sk007msd committed on
Commit
69a9db6
·
verified ·
1 Parent(s): 4e97447

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +27 -7
app.py CHANGED
@@ -1,15 +1,15 @@
1
- import os
2
- import time
3
  import requests
4
- import gradio as gr
5
  from huggingface_hub import login
6
  from dotenv import load_dotenv
7
 
8
  load_dotenv()
9
- image_API="https://api-inference.huggingface.co/models/black-forest-labs/FLUX.1-schnell"
10
  translation_API="https://api-inference.huggingface.co/models/facebook/nllb-200-distilled-1.3B"
11
  whisper_API="https://api-inference.huggingface.co/models/openai/whisper-large-v3"
12
-
13
  HF_TOKEN=os.getenv("HF_Token")
14
  login(HF_TOKEN)
15
  headers={"Authorization":f"Bearer {HF_TOKEN}"}
@@ -49,6 +49,24 @@ def query_image(prompt):
49
  time.sleep(delay)
50
  return None
51
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
52
  def process_audio(audio_path):
53
  if not audio_path:
54
  return None
@@ -58,7 +76,8 @@ def process_audio(audio_path):
58
  translation=query_translation(tamil_text)
59
  translated_text=translation.get("translated_text","Translation error")
60
  image_path=query_image(translated_text)
61
- return tamil_text,translated_text,image_path
 
62
  except Exception as e:
63
  return None,str(e),None
64
 
@@ -69,7 +88,8 @@ iface=gr.Interface(
69
  gr.Textbox(label="Tamil Text"),
70
  gr.Textbox(label="English Translation"),
71
  gr.Image(label="Generated Image")
 
72
  ],
73
  title="Speech-to-Image Generation"
74
  )
75
- iface.launch(share=True,server_name="0.0.0.0",server_port=7860)
 
1
+ import os
2
+ import time
3
  import requests
4
+ import gradio as gr
5
  from huggingface_hub import login
6
  from dotenv import load_dotenv
7
 
8
  load_dotenv()
9
+ image_API="https://api-inference.huggingface.co/models/stabilityai/stable-diffusion-2"
10
  translation_API="https://api-inference.huggingface.co/models/facebook/nllb-200-distilled-1.3B"
11
  whisper_API="https://api-inference.huggingface.co/models/openai/whisper-large-v3"
12
+ txt_API="https://api-inference.huggingface.co/models/meta-llama/Llama-3.2-1B"
13
  HF_TOKEN=os.getenv("HF_Token")
14
  login(HF_TOKEN)
15
  headers={"Authorization":f"Bearer {HF_TOKEN}"}
 
49
  time.sleep(delay)
50
  return None
51
 
52
def query_text_generation(prompt, *, max_retries=5, delay=10, timeout=60):
    """Request a short story about *prompt* from the text-generation endpoint.

    The request is POSTed to ``txt_API`` with the module-level ``headers``.
    An attempt counts as failed when the transport raises, the status code
    is not 200, the body is not valid JSON, or the JSON has neither of the
    two shapes handled below.

    Args:
        prompt: Text interpolated into the story instruction.
        max_retries: Total number of attempts before giving up.
        delay: Seconds to wait between two attempts.
        timeout: Per-request timeout in seconds, so a stalled connection
            cannot block the caller indefinitely.

    Returns:
        The generated text, or ``None`` when every attempt failed.
    """
    payload = {"inputs": f"give me a short story about {prompt}"}

    for attempt in range(1, max_retries + 1):
        try:
            response = requests.post(
                txt_API, headers=headers, json=payload, timeout=timeout
            )
            result = response.json() if response.status_code == 200 else None
        except (requests.RequestException, ValueError):
            # Transport failure or undecodable body: treat it like any other
            # failed attempt so the retry loop keeps its purpose.
            result = None

        # The response is either a list of result dicts or a single dict.
        if isinstance(result, list) and result:
            first = result[0]
            if isinstance(first, dict):
                return first.get("generated_text", "Text Generation Error")
        elif isinstance(result, dict) and "generated_text" in result:
            return result["generated_text"]

        # Only announce and wait when another attempt will actually follow.
        if attempt < max_retries:
            print(f"⚠️ Text generation failed, retrying in {delay} seconds...")
            time.sleep(delay)

    return None
67
+
68
+
69
+
70
  def process_audio(audio_path):
71
  if not audio_path:
72
  return None
 
76
  translation=query_translation(tamil_text)
77
  translated_text=translation.get("translated_text","Translation error")
78
  image_path=query_image(translated_text)
79
+ story=query_text_generation(translated_text)
80
+ return tamil_text,translated_text,image_path,story
81
  except Exception as e:
82
  return None,str(e),None
83
 
 
88
  gr.Textbox(label="Tamil Text"),
89
  gr.Textbox(label="English Translation"),
90
  gr.Image(label="Generated Image")
91
+ gr.Textbox(label="Story")
92
  ],
93
  title="Speech-to-Image Generation"
94
  )
95
+ iface.launch(share=True,server_name="0.0.0.0",server_port=7861)