Spaces:

mtg-upf
/

audio-difficulty

Running on Zero

App Files Files Community

PRamoneda committed on May 16

Commit

2e9908b

1 Parent(s): 7243f55

debug

Browse files

Files changed (1) hide show

app.py +26 -35

app.py CHANGED Viewed

@@ -16,24 +16,16 @@ CACHE_BASE = "models"
 def download_model_checkpoints(model_name: str, num_checkpoints: int = 5):
     cache_dir = os.path.join(CACHE_BASE, model_name)
     os.makedirs(cache_dir, exist_ok=True)
     for checkpoint_id in range(num_checkpoints):
         filename = f"{model_name}/checkpoint_{checkpoint_id}.pth"
         local_path = os.path.join(cache_dir, f"checkpoint_{checkpoint_id}.pth")
         if not os.path.exists(local_path):
-            print(f"Downloading {filename} from {REPO_ID} to {cache_dir}")
-            path = hf_hub_download(
-                repo_id=REPO_ID,
-                filename=filename,
-                cache_dir=cache_dir
-            )
-            # Copy to expected location
             if path != local_path:
                 import shutil
                 shutil.copy(path, local_path)
-def download_youtube_audio(url):
     output_path = "yt_audio.%(ext)s"
     ydl_opts = {
         "format": "bestaudio/best",
@@ -46,6 +38,8 @@ def download_youtube_audio(url):
         "quiet": True,
         "no_warnings": True
     }
     with yt_dlp.YoutubeDL(ydl_opts) as ydl:
         ydl.download([url])
@@ -58,39 +52,31 @@ def convert_to_mp3(input_path):
     audio.export(temp_audio.name, format="mp3")
     return temp_audio.name
-def process_input(input_file, youtube_url):
     captured_output = io.StringIO()
     sys.stdout = captured_output
-    audio_path = None
-    mp3_path = None
     if youtube_url:
-        audio_path = download_youtube_audio(youtube_url)
         mp3_path = audio_path
     elif input_file:
         mime_type, _ = mimetypes.guess_type(input_file)
-        if mime_type and mime_type.startswith("video/"):
-            audio_path = convert_to_mp3(input_file)
-            mp3_path = audio_path
-        else:
-            audio_path = convert_to_mp3(input_file)
-            mp3_path = audio_path
     else:
         sys.stdout = sys.__stdout__
-        return "No audio or video provided.", None, None, None
-    model_cqt = "audio_midi_cqt5_ps_v5"
-    model_pr = "audio_midi_pianoroll_ps_5_v4"
-    model_multi = "audio_midi_multi_ps_v5"
-    download_model_checkpoints(model_cqt)
-    download_model_checkpoints(model_pr)
-    download_model_checkpoints(model_multi)
-    diff_cqt = predict_difficulty(audio_path, model_name=model_cqt, rep="cqt5")
-    diff_pr = predict_difficulty(audio_path, model_name=model_pr, rep="pianoroll5")
-    diff_multi = predict_difficulty(audio_path, model_name=model_multi, rep="multimodal5")
     sys.stdout = sys.__stdout__
     log_output = captured_output.getvalue()
@@ -111,7 +97,8 @@ demo = gr.Interface(
     fn=process_input,
     inputs=[
         gr.File(label="Upload MP3 or MP4", type="filepath"),
-        gr.Textbox(label="YouTube URL")
     ],
     outputs=[
         gr.Textbox(label="Difficulty predictions"),
@@ -121,8 +108,12 @@ demo = gr.Interface(
         gr.Textbox(label="Console Output")
     ],
     title="Music Difficulty Estimator",
-    description="Upload an MP3, MP4, or provide a YouTube URL. It extracts audio, predicts difficulty, and generates a MIDI file."
 )
 if __name__ == "__main__":
-    demo.launch(debug=True, share=True)

 def download_model_checkpoints(model_name: str, num_checkpoints: int = 5):
     cache_dir = os.path.join(CACHE_BASE, model_name)
     os.makedirs(cache_dir, exist_ok=True)
     for checkpoint_id in range(num_checkpoints):
         filename = f"{model_name}/checkpoint_{checkpoint_id}.pth"
         local_path = os.path.join(cache_dir, f"checkpoint_{checkpoint_id}.pth")
         if not os.path.exists(local_path):
+            path = hf_hub_download(repo_id=REPO_ID, filename=filename, cache_dir=cache_dir)
             if path != local_path:
                 import shutil
                 shutil.copy(path, local_path)
+def download_youtube_audio(url, cookie_file=None):
     output_path = "yt_audio.%(ext)s"
     ydl_opts = {
         "format": "bestaudio/best",
         "quiet": True,
         "no_warnings": True
     }
+    if cookie_file:
+        ydl_opts["cookiefile"] = cookie_file  # <-- usa el archivo de cookies
     with yt_dlp.YoutubeDL(ydl_opts) as ydl:
         ydl.download([url])
     audio.export(temp_audio.name, format="mp3")
     return temp_audio.name
+def process_input(input_file, youtube_url, cookie_file):
+    # capture console output
     captured_output = io.StringIO()
     sys.stdout = captured_output
+    # process the audio/video input
     if youtube_url:
+        audio_path = download_youtube_audio(youtube_url, cookie_file)
         mp3_path = audio_path
     elif input_file:
         mime_type, _ = mimetypes.guess_type(input_file)
+        audio_path = convert_to_mp3(input_file)
+        mp3_path = audio_path
     else:
         sys.stdout = sys.__stdout__
+        return "No audio or video provided.", None, None, None, ""
+    # download model checkpoints
+    for model in ["audio_midi_cqt5_ps_v5", "audio_midi_pianoroll_ps_5_v4", "audio_midi_multi_ps_v5"]:
+        download_model_checkpoints(model)
+    # predictions
+    diff_cqt = predict_difficulty(audio_path, model_name="audio_midi_cqt5_ps_v5", rep="cqt5")
+    diff_pr = predict_difficulty(audio_path, model_name="audio_midi_pianoroll_ps_5_v4", rep="pianoroll5")
+    diff_multi = predict_difficulty(audio_path, model_name="audio_midi_multi_ps_v5", rep="multimodal5")
     sys.stdout = sys.__stdout__
     log_output = captured_output.getvalue()
     fn=process_input,
     inputs=[
         gr.File(label="Upload MP3 or MP4", type="filepath"),
+        gr.Textbox(label="YouTube URL"),
+        gr.File(label="Upload cookies.txt (optional)", file_types=["text"], type="filepath")
     ],
     outputs=[
         gr.Textbox(label="Difficulty predictions"),
         gr.Textbox(label="Console Output")
     ],
     title="Music Difficulty Estimator",
+    description=(
+        "Upload an MP3/MP4 or provide a YouTube URL. "
+        "If the video is age-restricted, export your YouTube cookies as a Netscape-format file "
+        "and upload it here. Then the app can download and process the audio."
+    )
 )
 if __name__ == "__main__":
+    demo.launch(debug=True)