Spaces:

nineninesix
/

KaniTTS

Running on Zero

App Files Community

ylankgz committed on Sep 18

Commit

ad693da

1 Parent(s): 00e4cff

enable settings

Browse files

Files changed (2) hide show

app.py +8 -12
util.py +1 -1

app.py CHANGED Viewed

@@ -114,28 +114,24 @@ with gr.Blocks(title="😻 KaniTTS - Text to Speech", theme=gr.themes.Default())
             )
             with gr.Accordion("Settings", open=False):
-                temperature = gr.Slider(
                     minimum=0.1, maximum=1.5, value=0.6, step=0.05,
-                    label="Temperature",
-                    info="Higher values (0.7-1.0) create more expressive but less stable speech"
                 )
                 top_p = gr.Slider(
                     minimum=0.1, maximum=1.0, value=0.95, step=0.05,
                     label="Top P",
-                    info="Nucleus sampling threshold"
                 )
-                repetition_penalty = gr.Slider(
                     minimum=1.0, maximum=2.0, value=1.1, step=0.05,
                     label="Repetition Penalty",
-                    info="Higher values discourage repetitive patterns"
                 )
-                max_new_tokens = gr.Slider(
                     minimum=100, maximum=2000, value=1200, step=100,
-                    label="Max Length",
-                    info="Maximum length of generated audio (in tokens)"
                 )
-            generate_btn = gr.Button("🎵 Generate Speech", variant="primary", size="lg")
         with gr.Column(scale=1):
@@ -154,7 +150,7 @@ with gr.Blocks(title="😻 KaniTTS - Text to Speech", theme=gr.themes.Default())
     # GPU generation event
     generate_btn.click(
         fn=generate_speech_gpu,
-        inputs=[text_input, model_dropdown],
         outputs=[audio_output, time_report_output]
     )
@@ -178,7 +174,7 @@ with gr.Blocks(title="😻 KaniTTS - Text to Speech", theme=gr.themes.Default())
         gr.Examples(
             examples=examples,
-            inputs=[text_input, model_dropdown, temperature, top_p, repetition_penalty, max_new_tokens],
             fn=generate_speech_gpu,
             outputs=[audio_output, time_report_output],
             cache_examples=True,

             )
             with gr.Accordion("Settings", open=False):
+                temp = gr.Slider(
                     minimum=0.1, maximum=1.5, value=0.6, step=0.05,
+                    label="Temp",
                 )
                 top_p = gr.Slider(
                     minimum=0.1, maximum=1.0, value=0.95, step=0.05,
                     label="Top P",
                 )
+                rp = gr.Slider(
                     minimum=1.0, maximum=2.0, value=1.1, step=0.05,
                     label="Repetition Penalty",
                 )
+                max_tok = gr.Slider(
                     minimum=100, maximum=2000, value=1200, step=100,
+                    label="Max Tokens",
                 )
+            generate_btn = gr.Button("Run", variant="primary", size="lg")
         with gr.Column(scale=1):
     # GPU generation event
     generate_btn.click(
         fn=generate_speech_gpu,
+        inputs=[text_input, model_dropdown, temp, top_p, rp, max_tok],
         outputs=[audio_output, time_report_output]
     )
         gr.Examples(
             examples=examples,
+            inputs=[text_input, model_dropdown, temp, top_p, rp, max_tok],
             fn=generate_speech_gpu,
             outputs=[audio_output, time_report_output],
             cache_examples=True,

util.py CHANGED Viewed

@@ -197,7 +197,7 @@ class KaniModel:
         model_request = point_2 - point_1
         player_time = point_3 - point_2
         total_time = point_3 - point_1
-        report = f"SPEECH TOKENS: {model_request:.2f}\n CODEC: {player_time:.2f}\nTOTAL: {total_time:.2f}"
         return report
     def run_model(self, text: str):

         model_request = point_2 - point_1
         player_time = point_3 - point_2
         total_time = point_3 - point_1
+        report = f"SPEECH TOKENS: {model_request:.2f}\nCODEC: {player_time:.2f}\nTOTAL: {total_time:.2f}"
         return report
     def run_model(self, text: str):