Spaces:

Genius-Society
/

piano_trans

Running

App Files Files

admin committed on Apr 22

Commit

c73c29a

1 Parent(s): 215960c

sync ms

Browse files

Files changed (2) hide show

app.py +126 -77
requirements.txt +2 -1

app.py CHANGED Viewed

@@ -1,20 +1,51 @@
 import os
 import re
 import json
-import uuid
 import torch
 import shutil
 import requests
 import gradio as gr
 from piano_transcription_inference import PianoTranscription, load_audio, sample_rate
-from huggingface_hub import snapshot_download
 from urllib.parse import urlparse
 from convert import midi2xml, xml2abc, xml2mxl, xml2jpg
 WEIGHTS_PATH = (
-    snapshot_download("Genius-Society/piano_trans", cache_dir="./__pycache__")
-    + "/CRNN_note_F1=0.9677_pedal_F1=0.9186.pth"
-)
 def clean_cache(cache_dir):
@@ -34,15 +65,18 @@ def download_audio(url: str, save_path: str):
 def is_url(s: str):
     try:
         result = urlparse(s)
         return all([result.scheme, result.netloc])
     except:
         return False
 def audio2midi(audio_path: str, cache_dir: str):
-    audio, _ = load_audio(audio_path, sr=sample_rate)
     transcriptor = PianoTranscription(
         device="cuda" if torch.cuda.is_available() else "cpu",
         checkpoint_path=WEIGHTS_PATH,
@@ -52,25 +86,11 @@ def audio2midi(audio_path: str, cache_dir: str):
     return midi_path, os.path.basename(audio_path).split(".")[-2].capitalize()
-def upl_infer(audio_path: str, cache_dir="./__pycache__/mode1"):
-    clean_cache(cache_dir)
-    try:
-        print(audio_path)
-        midi, title = audio2midi(audio_path, cache_dir)
-        xml = midi2xml(midi, title)
-        abc = xml2abc(xml)
-        mxl = xml2mxl(xml)
-        pdf, jpg = xml2jpg(xml)
-        return midi, pdf, xml, mxl, abc, jpg
-    except Exception as e:
-        return None, None, None, None, f"{e}", None
-def get_1st_int(input_string: str):
     match = re.search(r"\d+", input_string)
     if match:
         return str(int(match.group()))
     else:
         return ""
@@ -79,9 +99,11 @@ def music163_song_info(id: str):
     detail_api = "https://music.163.com/api/v3/song/detail"
     parm_dict = {"id": id, "c": str([{"id": id}]), "csrf_token": ""}
     free = False
-    song_name = "Failed to get the song"
     response = requests.get(detail_api, params=parm_dict)
     if response.status_code == 200:
         data = json.loads(response.text)
         if data and "songs" in data and data["songs"]:
             fee = int(data["songs"][0]["fee"])
@@ -89,31 +111,48 @@ def music163_song_info(id: str):
             song_name = str(data["songs"][0]["name"])
         else:
-            song_name = "The song does not exist"
     else:
-        raise ConnectionError(f"Error: {response.status_code}, {response.text}")
     return song_name, free
 def url_infer(song: str, cache_dir="./__pycache__/mode2"):
     song_name = ""
-    clean_cache(cache_dir)
-    audio_path = f"/tmp/gradio/{uuid.uuid4().hex}/"
-    os.makedirs(audio_path, exist_ok=True)
     try:
         if (is_url(song) and "163" in song and "?id=" in song) or song.isdigit():
-            song_id = get_1st_int(song.split("?id=")[-1])
-            song_url = f"https://music.163.com/song/media/outer/url?id={song_id}.mp3"
             song_name, free = music163_song_info(song_id)
             if not free:
-                raise AttributeError("Unable to parse VIP songs")
-            audio_path += f"{song_id}.mp3"
-            download_audio(song_url, audio_path)
-        midi, title = audio2midi(audio_path, cache_dir)
         if song_name:
             title = song_name
@@ -121,54 +160,64 @@ def url_infer(song: str, cache_dir="./__pycache__/mode2"):
         abc = xml2abc(xml)
         mxl = xml2mxl(xml)
         pdf, jpg = xml2jpg(xml)
-        return audio_path, midi, pdf, xml, mxl, abc, jpg
     except Exception as e:
-        return None, None, None, None, None, f"{e}", None
 if __name__ == "__main__":
     with gr.Blocks() as iface:
-        gr.Markdown("# Piano Transcription Tool")
-        # with gr.Tab("Uploading Mode"):
-        gr.Interface(
-            fn=upl_infer,
-            inputs=gr.Audio(
-                label="Upload an audio",
-                type="filepath",
-            ),
-            outputs=[
-                gr.File(label="Download MIDI"),
-                gr.File(label="Download PDF score"),
-                gr.File(label="Download MusicXML"),
-                gr.File(label="Download MXL"),
-                gr.Textbox(label="ABC notation", show_copy_button=True),
-                gr.Image(label="Staff", type="filepath", show_share_button=False),
-            ],
-            description="Please make sure the audio is completely uploaded before clicking Submit",
-            flagging_mode="never",
-        )
-        # with gr.Tab("Direct Link Mode"):
-        #     gr.Interface(
-        #         fn=url_infer,
-        #         inputs=gr.Textbox(
-        #             label="Input audio direct link",
-        #             placeholder="https://music.163.com/#/song?id=",
-        #         ),
-        #         outputs=[
-        #             gr.Audio(label="Download audio", type="filepath"),
-        #             gr.File(label="Download MIDI"),
-        #             gr.File(label="Download PDF score"),
-        #             gr.File(label="Download MusicXML"),
-        #             gr.File(label="Download MXL"),
-        #             gr.Textbox(label="ABC notation", show_copy_button=True),
-        #             gr.Image(label="Staff", type="filepath"),
-        #         ],
-        #         description="For Netease Cloud music, you can directly input the non-VIP song page link",
-        #         examples=["1945798894", "1945798973", "1946098771"],
-        #         flagging_mode="never",
-        #         cache_examples=False,
-        #     )
     iface.launch()

 import os
 import re
 import json
 import torch
 import shutil
 import requests
+import modelscope
+import huggingface_hub
 import gradio as gr
 from piano_transcription_inference import PianoTranscription, load_audio, sample_rate
 from urllib.parse import urlparse
 from convert import midi2xml, xml2abc, xml2mxl, xml2jpg
+EN_US = os.getenv("LANG") != "zh_CN.UTF-8"
+ZH2EN = {
+    "上传模式": "Uploading Mode",
+    "上传音频": "Upload an audio",
+    "下载 MIDI": "Download MIDI",
+    "下载 PDF 乐谱": "Download PDF score",
+    "下载 MusicXML": "Download MusicXML",
+    "下载 MXL": "Download MXL",
+    "ABC 记谱": "ABC notation",
+    "五线谱": "Staff",
+    "状态栏": "Status",
+    "请上传音频 100% 后再点提交": "Please make sure the audio is completely uploaded before clicking Submit",
+    "直链模式": "Direct Link Mode",
+    "输入音频 URL 直链": "Input audio direct link",
+    "下载音频": "Download audio",
+    "网易云音乐可直接输入非 VIP 歌曲页面链接自动解析": "For Netease Cloud music, you can directly input the non-VIP song page link",
+    "# 钢琴转谱工具": "Piano Transcription Tool",
+}
 WEIGHTS_PATH = (
+    huggingface_hub.snapshot_download(
+        "Genius-Society/piano_trans",
+        cache_dir="./__pycache__",
+    )
+    if EN_US
+    else modelscope.snapshot_download(
+        "Genius-Society/piano_trans",
+        cache_dir="./__pycache__",
+    )
+) + "/CRNN_note_F1=0.9677_pedal_F1=0.9186.pth"
+def _L(zh_txt: str):
+    return ZH2EN[zh_txt] if EN_US else zh_txt
 def clean_cache(cache_dir):
 def is_url(s: str):
     try:
+        # 解析字符串
         result = urlparse(s)
+        # 检查scheme（如http, https）和netloc（域名）
         return all([result.scheme, result.netloc])
     except:
+        # 如果解析过程中发生异常，则返回False
         return False
 def audio2midi(audio_path: str, cache_dir: str):
+    audio, _ = load_audio(audio_path, sr=sample_rate, mono=True)
     transcriptor = PianoTranscription(
         device="cuda" if torch.cuda.is_available() else "cpu",
         checkpoint_path=WEIGHTS_PATH,
     return midi_path, os.path.basename(audio_path).split(".")[-2].capitalize()
+def get_first_integer(input_string: str):
     match = re.search(r"\d+", input_string)
     if match:
         return str(int(match.group()))
     else:
         return ""
     detail_api = "https://music.163.com/api/v3/song/detail"
     parm_dict = {"id": id, "c": str([{"id": id}]), "csrf_token": ""}
     free = False
+    song_name = "获取歌曲失败"
     response = requests.get(detail_api, params=parm_dict)
+    # 检查请求是否成功
     if response.status_code == 200:
+        # 处理成功响应
         data = json.loads(response.text)
         if data and "songs" in data and data["songs"]:
             fee = int(data["songs"][0]["fee"])
             song_name = str(data["songs"][0]["name"])
         else:
+            song_name = "歌曲不存在"
     else:
+        raise ConnectionError(f"错误: {response.status_code}, {response.text}")
     return song_name, free
+def upl_infer(audio_path: str, cache_dir="./__pycache__/mode1"):
+    status = "Success"
+    midi = pdf = xml = mxl = abc = jpg = None
+    try:
+        clean_cache(cache_dir)
+        midi, title = audio2midi(audio_path, cache_dir)
+        xml = midi2xml(midi, title)
+        abc = xml2abc(xml)
+        mxl = xml2mxl(xml)
+        pdf, jpg = xml2jpg(xml)
+    except Exception as e:
+        status = f"{e}"
+    return status, midi, pdf, xml, mxl, abc, jpg
 def url_infer(song: str, cache_dir="./__pycache__/mode2"):
     song_name = ""
+    status = "Success"
+    download_path = f"{cache_dir}/output.mp3"
+    midi = pdf = xml = mxl = abc = jpg = None
     try:
+        clean_cache(cache_dir)
         if (is_url(song) and "163" in song and "?id=" in song) or song.isdigit():
+            song_id = get_first_integer(song.split("?id=")[-1])
+            song = f"https://music.163.com/song/media/outer/url?id={song_id}.mp3"
             song_name, free = music163_song_info(song_id)
             if not free:
+                raise AttributeError("付费歌曲无法解析")
+            download_audio(song, download_path)
+        midi, title = audio2midi(download_path, cache_dir)
         if song_name:
             title = song_name
         abc = xml2abc(xml)
         mxl = xml2mxl(xml)
         pdf, jpg = xml2jpg(xml)
+        if not os.path.exists(download_path):
+            raise FileExistsError(f"{download_path} not exist")
     except Exception as e:
+        status = f"{e}"
+    return status, download_path, midi, pdf, xml, mxl, abc, jpg
 if __name__ == "__main__":
     with gr.Blocks() as iface:
+        gr.Markdown(_L("# 钢琴转谱工具"))
+        with gr.Tab(_L("上传模式")):
+            gr.Interface(
+                fn=upl_infer,
+                inputs=gr.Audio(label=_L("上传音频"), type="filepath"),
+                outputs=[
+                    gr.Textbox(label=_L("状态栏"), show_copy_button=True),
+                    gr.File(label=_L("下载 MIDI")),
+                    gr.File(label=_L("下载 PDF 乐谱")),
+                    gr.File(label=_L("下载 MusicXML")),
+                    gr.File(label=_L("下载 MXL")),
+                    gr.Textbox(label=_L("ABC 记谱"), show_copy_button=True),
+                    gr.Image(
+                        label=_L("五线谱"),
+                        type="filepath",
+                        show_share_button=False,
+                    ),
+                ],
+                title=_L("请上传音频 100% 后再点提交"),
+                flagging_mode="never",
+            )
+        with gr.Tab(_L("直链模式")):
+            gr.Interface(
+                fn=url_infer,
+                inputs=gr.Textbox(
+                    label=_L("输入音频 URL 直链"),
+                    placeholder="https://music.163.com/#/song?id=",
+                ),
+                outputs=[
+                    gr.Textbox(label=_L("状态栏"), show_copy_button=True),
+                    gr.Audio(label=_L("下载音频"), type="filepath"),
+                    gr.File(label=_L("下载 MIDI")),
+                    gr.File(label=_L("下载 PDF 乐谱")),
+                    gr.File(label=_L("下载 MusicXML")),
+                    gr.File(label=_L("下载 MXL")),
+                    gr.Textbox(label=_L("ABC 记谱"), show_copy_button=True),
+                    gr.Image(
+                        label=_L("五线谱"),
+                        type="filepath",
+                        show_share_button=False,
+                    ),
+                ],
+                title=_L("网易云音乐可直接输入非 VIP 歌曲页面链接自动解析"),
+                examples=["1945798894", "1945798973", "1946098771"],
+                flagging_mode="never",
+                cache_examples=False,
+            )
     iface.launch()

requirements.txt CHANGED Viewed

@@ -1,4 +1,5 @@
-torch
 pymupdf
 music21
 piano_transcription_inference

+torch==2.6.0+cu118
+-f https://download.pytorch.org/whl/torch
 pymupdf
 music21
 piano_transcription_inference