Spaces:

11mlabs
/

IndriVoice

Running

skriller18 committed on Nov 26, 2024

Commit

7c4c876

1 Parent(s): f1884d8

Dropdown Added

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,10 +3,6 @@ import torchaudio
 from transformers import pipeline
 import streamlit as st
-x = st.slider('Select a value')
-st.write(x, 'squared is', x * x)
 model_id = '11mlabs/indri-0.1-124m-tts'
 task = 'indri-tts'
@@ -17,14 +13,33 @@ pipe = pipeline(
     trust_remote_code=True
 )
-text_input = st.text_area("Enter text for TTS (max 200 characters):", max_chars=200)
-speaker_name = st.text_input("Enter speaker's name:")
 if st.button("Generate Audio"):
     if text_input:
-        output = pipe([text_input], speaker=speaker_name)
         torchaudio.save('output.wav', output[0]['audio'][0], sample_rate=24000)
-        st.audio('output.wav')  # Display audio blob output
     else:
         st.warning("Please enter text to generate audio.")

 from transformers import pipeline
 import streamlit as st
 model_id = '11mlabs/indri-0.1-124m-tts'
 task = 'indri-tts'
     trust_remote_code=True
 )
+st.title("Indri")
+st.subheader("Ultrafast multi-modal AI")
+speakers = {
+    "[spkr_63] : 🇬🇧 👨 book reader",
+    "[spkr_67] : 🇺🇸 👨 influencer",
+    "[spkr_68] : 🇮🇳 👨 book reader",
+    "[spkr_69] : 🇮🇳 👨 book reader",
+    "[spkr_70] : 🇮🇳 👨 motivational speaker",
+    "[spkr_62] : 🇮🇳 👨 book reader heavy",
+    "[spkr_53] : 🇮🇳 👩 recipe reciter",
+    "[spkr_60] : 🇮🇳 👩 book reader",
+    "[spkr_74] : 🇺🇸 👨 book reader",
+    "[spkr_75] : 🇮🇳 👨 entrepreneur",
+    "[spkr_76] : 🇬🇧 👨 nature lover",
+    "[spkr_77] : 🇮🇳 👨 influencer",
+    "[spkr_66] : 🇮🇳 👨 politician"
+}
+speaker_id = st.selectbox("Select a speaker:", options=list(speakers.keys()), format_func=lambda x: speakers[x])
+text_input = st.text_area("Enter text for TTS (max 200 characters):", max_chars=200)
 if st.button("Generate Audio"):
     if text_input:
+        output = pipe([text_input], speaker=speaker_id)
         torchaudio.save('output.wav', output[0]['audio'][0], sample_rate=24000)
+        st.audio('output.wav')
     else:
         st.warning("Please enter text to generate audio.")