Spaces:
Running
Running
admin
committed on
Commit
·
36a6259
1
Parent(s):
5b8d4bb
2 pure en
Browse files
- app.py +17 -18
- requirements.txt +3 -3
- utils.py +4 -10
app.py
CHANGED
|
@@ -8,22 +8,23 @@ import numpy as np
|
|
| 8 |
import gradio as gr
|
| 9 |
import librosa.display
|
| 10 |
import matplotlib.pyplot as plt
|
| 11 |
-
from utils import get_modelist, find_files, embed_img
|
| 12 |
from collections import Counter
|
| 13 |
from model import EvalNet
|
| 14 |
|
| 15 |
|
| 16 |
TRANSLATE = {
|
| 17 |
-
"vibrato": "
|
| 18 |
-
"upward_portamento": "
|
| 19 |
-
"downward_portamento": "
|
| 20 |
-
"returning_portamento": "
|
| 21 |
-
"glissando": "
|
| 22 |
-
"tremolo": "
|
| 23 |
-
"harmonics": "
|
| 24 |
-
"plucks": "
|
| 25 |
}
|
| 26 |
CLASSES = list(TRANSLATE.keys())
|
|
|
|
| 27 |
SAMPLE_RATE = 44100
|
| 28 |
|
| 29 |
|
|
@@ -146,7 +147,7 @@ def infer(wav_path: str, log_name: str, folder_path=TEMP_DIR):
|
|
| 146 |
shutil.rmtree(folder_path)
|
| 147 |
|
| 148 |
if not wav_path:
|
| 149 |
-
return None, "
|
| 150 |
|
| 151 |
try:
|
| 152 |
model = EvalNet(log_name, len(TRANSLATE)).model
|
|
@@ -182,27 +183,25 @@ if __name__ == "__main__":
|
|
| 182 |
gr.Interface(
|
| 183 |
fn=infer,
|
| 184 |
inputs=[
|
| 185 |
-
gr.Audio(label="
|
| 186 |
-
gr.Dropdown(
|
| 187 |
-
choices=models, label="选择模型 Select a model", value=models[0]
|
| 188 |
-
),
|
| 189 |
],
|
| 190 |
outputs=[
|
| 191 |
-
gr.Textbox(label="
|
| 192 |
gr.Textbox(
|
| 193 |
-
label="
|
| 194 |
show_copy_button=True,
|
| 195 |
),
|
| 196 |
],
|
| 197 |
examples=examples,
|
| 198 |
cache_examples=False,
|
| 199 |
flagging_mode="never",
|
| 200 |
-
title="
|
| 201 |
)
|
| 202 |
|
| 203 |
gr.Markdown(
|
| 204 |
"""
|
| 205 |
-
#
|
| 206 |
```bibtex
|
| 207 |
@dataset{zhaorui_liu_2021_5676893,
|
| 208 |
author = {Monan Zhou, Shenyang Xu, Zhaorui Liu, Zhaowen Wang, Feng Yu, Wei Li and Baoqiang Han},
|
|
|
|
| 8 |
import gradio as gr
|
| 9 |
import librosa.display
|
| 10 |
import matplotlib.pyplot as plt
|
| 11 |
+
from utils import get_modelist, find_files, embed_img
|
| 12 |
from collections import Counter
|
| 13 |
from model import EvalNet
|
| 14 |
|
| 15 |
|
| 16 |
TRANSLATE = {
|
| 17 |
+
"vibrato": "chan yin",
|
| 18 |
+
"upward_portamento": "shang hua yin",
|
| 19 |
+
"downward_portamento": "xia hua yin",
|
| 20 |
+
"returning_portamento": "hui hua yin",
|
| 21 |
+
"glissando": "gua zou, hua zhi",
|
| 22 |
+
"tremolo": "yao zhi",
|
| 23 |
+
"harmonics": "fan yin",
|
| 24 |
+
"plucks": "gou, da, mo, tuo, ...",
|
| 25 |
}
|
| 26 |
CLASSES = list(TRANSLATE.keys())
|
| 27 |
+
TEMP_DIR = "./__pycache__/tmp"
|
| 28 |
SAMPLE_RATE = 44100
|
| 29 |
|
| 30 |
|
|
|
|
| 147 |
shutil.rmtree(folder_path)
|
| 148 |
|
| 149 |
if not wav_path:
|
| 150 |
+
return None, "Please input an audio!"
|
| 151 |
|
| 152 |
try:
|
| 153 |
model = EvalNet(log_name, len(TRANSLATE)).model
|
|
|
|
| 183 |
gr.Interface(
|
| 184 |
fn=infer,
|
| 185 |
inputs=[
|
| 186 |
+
gr.Audio(label="Upload a recording", type="filepath"),
|
| 187 |
+
gr.Dropdown(choices=models, label="Select a model", value=models[0]),
|
|
|
|
|
|
|
| 188 |
],
|
| 189 |
outputs=[
|
| 190 |
+
gr.Textbox(label="Audio filename", show_copy_button=True),
|
| 191 |
gr.Textbox(
|
| 192 |
+
label="Guzheng playing tech recognition",
|
| 193 |
show_copy_button=True,
|
| 194 |
),
|
| 195 |
],
|
| 196 |
examples=examples,
|
| 197 |
cache_examples=False,
|
| 198 |
flagging_mode="never",
|
| 199 |
+
title="It is recommended to keep the recording length around 3s.",
|
| 200 |
)
|
| 201 |
|
| 202 |
gr.Markdown(
|
| 203 |
"""
|
| 204 |
+
# Cite
|
| 205 |
```bibtex
|
| 206 |
@dataset{zhaorui_liu_2021_5676893,
|
| 207 |
author = {Monan Zhou, Shenyang Xu, Zhaorui Liu, Zhaowen Wang, Feng Yu, Wei Li and Baoqiang Han},
|
requirements.txt
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
-
librosa
|
| 2 |
torch
|
|
|
|
|
|
|
| 3 |
matplotlib
|
| 4 |
torchvision
|
| 5 |
-
|
| 6 |
-
modelscope==1.15
|
|
|
|
|
|
|
| 1 |
torch
|
| 2 |
+
pillow
|
| 3 |
+
librosa
|
| 4 |
matplotlib
|
| 5 |
torchvision
|
| 6 |
+
modelscope[framework]==1.18
|
|
|
utils.py
CHANGED
|
@@ -5,10 +5,9 @@ from modelscope import snapshot_download
|
|
| 5 |
from PIL import Image
|
| 6 |
|
| 7 |
MODEL_DIR = snapshot_download(
|
| 8 |
-
|
| 9 |
-
cache_dir=
|
| 10 |
)
|
| 11 |
-
TEMP_DIR = f"{os.getcwd()}/flagged"
|
| 12 |
|
| 13 |
|
| 14 |
def toCUDA(x):
|
|
@@ -34,22 +33,17 @@ def get_modelist(model_dir=MODEL_DIR):
|
|
| 34 |
try:
|
| 35 |
entries = os.listdir(model_dir)
|
| 36 |
except OSError as e:
|
| 37 |
-
print(f"
|
| 38 |
return
|
| 39 |
|
| 40 |
-
# 遍历所有条目
|
| 41 |
output = []
|
| 42 |
for entry in entries:
|
| 43 |
-
# 获取完整路径
|
| 44 |
full_path = os.path.join(model_dir, entry)
|
| 45 |
-
# 跳过'.git'文件夹
|
| 46 |
if entry == ".git" or entry == "examples":
|
| 47 |
-
print(f"
|
| 48 |
continue
|
| 49 |
|
| 50 |
-
# 检查条目是文件还是目录
|
| 51 |
if os.path.isdir(full_path):
|
| 52 |
-
# 打印目录路径
|
| 53 |
output.append(os.path.basename(full_path))
|
| 54 |
|
| 55 |
return output
|
|
|
|
| 5 |
from PIL import Image
|
| 6 |
|
| 7 |
MODEL_DIR = snapshot_download(
|
| 8 |
+
"ccmusic-database/GZ_IsoTech",
|
| 9 |
+
cache_dir="./__pycache__",
|
| 10 |
)
|
|
|
|
| 11 |
|
| 12 |
|
| 13 |
def toCUDA(x):
|
|
|
|
| 33 |
try:
|
| 34 |
entries = os.listdir(model_dir)
|
| 35 |
except OSError as e:
|
| 36 |
+
print(f"Cannot access {model_dir}: {e}")
|
| 37 |
return
|
| 38 |
|
|
|
|
| 39 |
output = []
|
| 40 |
for entry in entries:
|
|
|
|
| 41 |
full_path = os.path.join(model_dir, entry)
|
|
|
|
| 42 |
if entry == ".git" or entry == "examples":
|
| 43 |
+
print(f"Skip .git or examples dir: {full_path}")
|
| 44 |
continue
|
| 45 |
|
|
|
|
| 46 |
if os.path.isdir(full_path):
|
|
|
|
| 47 |
output.append(os.path.basename(full_path))
|
| 48 |
|
| 49 |
return output
|