Robust model for vocal pitch estimation.
from mirbox.pitch import RMVPE
model = RMVPE(device="cuda")
result = model("input.wav")
print(result["f0"])
model.pt
-