mirror of
https://github.com/RVC-Project/Retrieval-based-Voice-Conversion-WebUI.git
synced 2025-05-06 20:01:37 +08:00
fix(hash): use precise npz instead of mp3
This commit is contained in:
parent
ade937b86a
commit
0f36233017
@ -5,7 +5,6 @@ import pathlib
|
|||||||
from scipy.fft import fft
|
from scipy.fft import fft
|
||||||
from pybase16384 import encode_to_string, decode_from_string
|
from pybase16384 import encode_to_string, decode_from_string
|
||||||
|
|
||||||
from infer.lib.audio import load_audio
|
|
||||||
from configs import CPUConfig, singleton_variable
|
from configs import CPUConfig, singleton_variable
|
||||||
|
|
||||||
from .pipeline import Pipeline
|
from .pipeline import Pipeline
|
||||||
@ -28,24 +27,21 @@ class TorchSeedContext:
|
|||||||
half_hash_len = 512
|
half_hash_len = 512
|
||||||
expand_factor = 65536 * 8
|
expand_factor = 65536 * 8
|
||||||
|
|
||||||
|
@singleton_variable
|
||||||
|
def original_audio_storage():
|
||||||
|
return np.load(pathlib.Path(__file__).parent / "lgdsng.npz")
|
||||||
|
|
||||||
|
@singleton_variable
|
||||||
|
def original_audio():
|
||||||
|
return original_audio_storage()["a"]
|
||||||
|
|
||||||
@singleton_variable
|
@singleton_variable
|
||||||
def original_audio_time_minus():
|
def original_audio_time_minus():
|
||||||
__original_audio = load_audio(
|
return original_audio_storage()["t"]
|
||||||
str(pathlib.Path(__file__).parent / "lgdsng.mp3"), 16000
|
|
||||||
)
|
|
||||||
np.divide(__original_audio, np.abs(__original_audio).max(), __original_audio)
|
|
||||||
return -__original_audio
|
|
||||||
|
|
||||||
|
|
||||||
@singleton_variable
|
@singleton_variable
|
||||||
def original_audio_freq_minus():
|
def original_audio_freq_minus():
|
||||||
__original_audio = load_audio(
|
return original_audio_storage()["f"]
|
||||||
str(pathlib.Path(__file__).parent / "lgdsng.mp3"), 16000
|
|
||||||
)
|
|
||||||
np.divide(__original_audio, np.abs(__original_audio).max(), __original_audio)
|
|
||||||
__original_audio = fft(__original_audio)
|
|
||||||
return -__original_audio
|
|
||||||
|
|
||||||
|
|
||||||
def _cut_u16(n):
|
def _cut_u16(n):
|
||||||
@ -85,13 +81,9 @@ def wave_hash(time_field):
|
|||||||
return encode_to_string(hash.tobytes())
|
return encode_to_string(hash.tobytes())
|
||||||
|
|
||||||
|
|
||||||
def audio_hash(file):
|
|
||||||
return wave_hash(load_audio(file, 16000))
|
|
||||||
|
|
||||||
|
|
||||||
def model_hash(config, tgt_sr, net_g, if_f0, version):
|
def model_hash(config, tgt_sr, net_g, if_f0, version):
|
||||||
pipeline = Pipeline(tgt_sr, config)
|
pipeline = Pipeline(tgt_sr, config)
|
||||||
audio = load_audio(str(pathlib.Path(__file__).parent / "lgdsng.mp3"), 16000)
|
audio = original_audio()
|
||||||
audio_max = np.abs(audio).max() / 0.95
|
audio_max = np.abs(audio).max() / 0.95
|
||||||
if audio_max > 1:
|
if audio_max > 1:
|
||||||
np.divide(audio, audio_max, audio)
|
np.divide(audio, audio_max, audio)
|
||||||
|
Binary file not shown.
BIN
infer/modules/vc/lgdsng.npz
Normal file
BIN
infer/modules/vc/lgdsng.npz
Normal file
Binary file not shown.
Loading…
x
Reference in New Issue
Block a user