so-vits-svc/preprocess_hubert_f0.py

import argparse
import logging
import os
import random
from concurrent.futures import ProcessPoolExecutor
from glob import glob
from random import shuffle

import librosa
import numpy as np
import torch
import torch.multiprocessing as mp
from loguru import logger
from tqdm import tqdm

import diffusion.logger.utils as du
import utils
from diffusion.vocoder import Vocoder
from modules.mel_processing import spectrogram_torch

# Restrict the numba and matplotlib loggers to WARNING and above so their
# lower-level messages do not clutter the preprocessing output.
logging.getLogger("numba").setLevel(logging.WARNING)
logging.getLogger("matplotlib").setLevel(logging.WARNING)

# Both configuration files are read at import time through relative paths,
# so the script has to be started from the directory that contains "configs/".
hps = utils.get_hparams_from_file("configs/config.json")
dconfig = du.load_config("configs/diffusion.yaml")
# Module-level shortcuts used by the feature extraction functions below.
sampling_rate = hps.data.sampling_rate
hop_length = hps.data.hop_length
# Speech encoder name; passed to utils.get_speech_encoder in process_batch.
speech_encoder = hps["model"]["speech_encoder"]


def process_one(filename, hmodel, f0p, rank, diff=False, mel_extractor=None):
    """Extract and cache the training features for a single audio file.

    Every feature is written next to the source file and is skipped when its
    output file already exists, so an interrupted run can simply be restarted.

    Args:
        filename: Path of the audio file to process.
        hmodel: Speech encoder object; its ``encoder`` method is called on the
            waveform resampled to 16 kHz.
        f0p: Name of the F0 predictor handed to ``utils.get_f0_predictor``.
        rank: CUDA device index used for the tensors sent to the encoder and
            the mel extractor. Ignored when CUDA is not available, in which
            case the CPU is used.
        diff: When true, additionally write volume, mel and augmented
            mel/volume features.
        mel_extractor: Object exposing ``extract(audio, sampling_rate,
            keyshift=...)``. When ``None`` the mel features are skipped.

    Raises:
        ValueError: If the loaded sample rate differs from the configured one.
    """
    wav, sr = librosa.load(filename, sr=sampling_rate)
    audio_norm = torch.FloatTensor(wav)
    audio_norm = audio_norm.unsqueeze(0)
    # Fall back to the CPU instead of building a CUDA device that cannot exist.
    if torch.cuda.is_available():
        device = torch.device(f"cuda:{rank}")
    else:
        device = torch.device("cpu")

    # --- content features from the speech encoder ---
    soft_path = filename + ".soft.pt"
    if not os.path.exists(soft_path):
        wav16k = librosa.resample(wav, orig_sr=sampling_rate, target_sr=16000)
        wav16k = torch.from_numpy(wav16k).to(device)
        # The output is only stored on disk, so no autograd graph is needed.
        with torch.no_grad():
            c = hmodel.encoder(wav16k)
        torch.save(c.cpu(), soft_path)

    # --- F0 and voiced/unvoiced flags ---
    f0_path = filename + ".f0.npy"
    if not os.path.exists(f0_path):
        f0_predictor = utils.get_f0_predictor(
            f0p,
            sampling_rate=sampling_rate,
            hop_length=hop_length,
            device=None,
            threshold=0.05,
        )
        f0, uv = f0_predictor.compute_f0_uv(wav)
        np.save(f0_path, np.asanyarray((f0, uv), dtype=object))

    # --- linear spectrogram ---
    # NOTE(review): unlike the other outputs this name is built with
    # str.replace, which also rewrites any ".wav" inside directory names.
    # Kept unchanged because readers of these files presumably derive the
    # name the same way — confirm before changing.
    spec_path = filename.replace(".wav", ".spec.pt")
    if not os.path.exists(spec_path):
        # Safety net: librosa.load was asked for `sampling_rate` above.
        if sr != hps.data.sampling_rate:
            raise ValueError(
                "{} SR doesn't match target {} SR".format(
                    sr, hps.data.sampling_rate
                )
            )

        spec = spectrogram_torch(
            audio_norm,
            hps.data.filter_length,
            hps.data.sampling_rate,
            hps.data.hop_length,
            hps.data.win_length,
            center=False,
        )
        spec = torch.squeeze(spec, 0)
        torch.save(spec, spec_path)

    # --- volume envelope ---
    volume_extractor = None
    if diff or hps.model.vol_embedding:
        volume_path = filename + ".vol.npy"
        volume_extractor = utils.Volume_Extractor(hop_length)
        if not os.path.exists(volume_path):
            volume = volume_extractor.extract(audio_norm)
            np.save(volume_path, volume.to('cpu').numpy())

    # --- diffusion features: mel plus a randomly augmented mel/volume pair ---
    if diff:
        mel_path = filename + ".mel.npy"
        if not os.path.exists(mel_path) and mel_extractor is not None:
            mel_t = mel_extractor.extract(audio_norm.to(device), sampling_rate)
            mel = mel_t.squeeze().to('cpu').numpy()
            np.save(mel_path, mel)

        aug_mel_path = filename + ".aug_mel.npy"
        aug_vol_path = filename + ".aug_vol.npy"
        # Without a mel extractor the augmented mel cannot be produced; skip
        # it instead of failing on an unbound variable.
        need_aug_mel = mel_extractor is not None and not os.path.exists(aug_mel_path)
        need_aug_vol = not os.path.exists(aug_vol_path)
        # Only pay for the augmentation when at least one output is missing.
        if need_aug_mel or need_aug_vol:
            max_amp = float(torch.max(torch.abs(audio_norm))) + 1e-5
            # Cap the gain so the scaled peak amplitude stays at or below 1.
            max_shift = min(1, np.log10(1 / max_amp))
            log10_vol_shift = random.uniform(-1, max_shift)
            keyshift = random.uniform(-5, 5)
            gain = 10 ** log10_vol_shift
            if need_aug_mel:
                aug_mel_t = mel_extractor.extract(
                    audio_norm * gain, sampling_rate, keyshift=keyshift
                )
                aug_mel = aug_mel_t.squeeze().to('cpu').numpy()
                # The key shift is stored together with the augmented mel.
                np.save(aug_mel_path, np.asanyarray((aug_mel, keyshift), dtype=object))
            if need_aug_vol:
                aug_vol = volume_extractor.extract(audio_norm * gain)
                np.save(aug_vol_path, aug_vol.to('cpu').numpy())


def process_batch(file_chunk, f0p, diff=False, mel_extractor=None, device="cpu"):
    """Process one chunk of files inside a worker process.

    Loads the speech encoder once and then runs ``process_one`` on every file
    of the chunk.

    Args:
        file_chunk: Sequence of audio file paths handled by this worker.
        f0p: Name of the F0 predictor, forwarded to ``process_one``.
        diff: Forwarded to ``process_one``.
        mel_extractor: Forwarded to ``process_one``.
        device: Device for the speech encoder. Only used when CUDA is not
            available; otherwise a GPU is picked from the worker's rank.
    """
    logger.info("Loading speech encoder for content...")
    # _identity is empty when this is not running in a child process.
    rank = mp.current_process()._identity
    rank = rank[0] if len(rank) > 0 else 0
    # Default index so the call below never hits an unbound name on hosts
    # without CUDA.
    gpu_id = 0
    if torch.cuda.is_available():
        # Spread the workers over the visible GPUs.
        gpu_id = rank % torch.cuda.device_count()
        device = torch.device(f"cuda:{gpu_id}")
    logger.info(f"Rank {rank} uses device {device}")
    hmodel = utils.get_speech_encoder(speech_encoder, device=device)
    logger.info(f"Loaded speech encoder for rank {rank}")
    for filename in tqdm(file_chunk):
        process_one(filename, hmodel, f0p, gpu_id, diff, mel_extractor)

def parallel_process(filenames, num_processes, f0p, diff, mel_extractor, device):
    """Split ``filenames`` into contiguous chunks and process them in parallel.

    Args:
        filenames: List of audio file paths.
        num_processes: Number of worker processes and maximum number of chunks.
        f0p: Name of the F0 predictor, forwarded to ``process_batch``.
        diff: Forwarded to ``process_batch``.
        mel_extractor: Forwarded to ``process_batch``.
        device: Forwarded to ``process_batch``.

    Any exception raised in a worker is re-raised here when its result is
    collected.
    """
    total = len(filenames)
    if total == 0:
        # Nothing to do; avoid starting workers that would only load a model.
        return
    with ProcessPoolExecutor(max_workers=num_processes) as executor:
        tasks = []
        for i in range(num_processes):
            # Integer arithmetic keeps the chunk boundaries exact.
            start = i * total // num_processes
            end = (i + 1) * total // num_processes
            file_chunk = filenames[start:end]
            if not file_chunk:
                # Fewer files than processes: skip the empty share.
                continue
            tasks.append(executor.submit(process_batch, file_chunk, f0p, diff, mel_extractor, device=device))
        for task in tqdm(tasks):
            task.result()

# Command-line entry point: parse the options, optionally load the mel
# extractor, collect the audio files and hand them to the worker pool.
if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument('-d', '--device', type=str, default=None)
    parser.add_argument(
        "--in_dir", type=str, default="dataset/44k", help="path to input dir"
    )
    parser.add_argument(
        '--use_diff',action='store_true', help='Whether to use the diffusion model'
    )
    # The help text used to advertise "pm" although the default is "dio".
    parser.add_argument(
        '--f0_predictor', type=str, default="dio", help='Select F0 predictor, can select crepe,pm,dio,harvest,rmvpe,fcpe|default: dio(note: crepe is original F0 using mean filter)'
    )
    parser.add_argument(
        '--num_processes', type=int, default=1, help='You are advised to set the number of processes to the same as the number of CPU cores'
    )
    args = parser.parse_args()
    f0p = args.f0_predictor
    device = args.device
    if device is None:
        device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

    print(speech_encoder)
    # loguru formats messages with str.format, so a bare extra positional
    # argument is dropped; build the full message instead.
    logger.info("Using device: " + str(device))
    logger.info("Using SpeechEncoder: " + speech_encoder)
    logger.info("Using extractor: " + f0p)
    logger.info("Using diff Mode: " + str( args.use_diff))

    if args.use_diff:
        print("use_diff")
        print("Loading Mel Extractor...")
        mel_extractor = Vocoder(dconfig.vocoder.type, dconfig.vocoder.ckpt, device=device)
        print("Loaded Mel Extractor.")
    else:
        mel_extractor = None
    # The pattern matches .wav files exactly one directory below in_dir.
    filenames = glob(f"{args.in_dir}/*/*.wav", recursive=True)  # [:10]
    # Shuffle before the list is split into per-worker chunks.
    shuffle(filenames)
    mp.set_start_method("spawn", force=True)

    num_processes = args.num_processes
    if num_processes == 0:
        # 0 means "one process per CPU"; os.cpu_count() may return None.
        num_processes = os.cpu_count() or 1

    parallel_process(filenames, num_processes, f0p, args.use_diff, mel_extractor, device)
chore: code cleanup by `ruff fix` 2023-06-26 06:57:53 +00:00			`import argparse`
			`import logging`
upload code 2023-03-10 10:11:04 +00:00			`import os`
diff 2023-05-16 05:17:51 +00:00			`import random`
chore: code cleanup by `ruff fix` 2023-06-26 06:57:53 +00:00			`from concurrent.futures import ProcessPoolExecutor`
			`from glob import glob`
			`from random import shuffle`
Update preprocess_hubert_f0.py Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2023-07-22 06:55:20 +00:00
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`import librosa`
			`import numpy as np`
chore: code cleanup by `ruff fix` 2023-06-26 06:57:53 +00:00			`import torch`
ruff fix 2023-07-22 12:18:20 +00:00			`import torch.multiprocessing as mp`
ruff fix 2023-07-22 15:02:52 +00:00			`from loguru import logger`
upload code 2023-03-10 10:11:04 +00:00			`from tqdm import tqdm`
chore: code cleanup by `ruff fix` 2023-06-26 06:57:53 +00:00
			`import diffusion.logger.utils as du`
			`import utils`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`from diffusion.vocoder import Vocoder`
remove redundent spec_gen and fix related bug 2023-03-24 05:00:14 +00:00			`from modules.mel_processing import spectrogram_torch`
upload code 2023-03-10 10:11:04 +00:00
remove redundent spec_gen and fix related bug 2023-03-24 05:00:14 +00:00			`logging.getLogger("numba").setLevel(logging.WARNING)`
diff 2023-05-16 05:17:51 +00:00			`logging.getLogger("matplotlib").setLevel(logging.WARNING)`

upload code 2023-03-10 10:11:04 +00:00			`hps = utils.get_hparams_from_file("configs/config.json")`
diff 2023-05-16 05:17:51 +00:00			`dconfig = du.load_config("configs/diffusion.yaml")`
upload code 2023-03-10 10:11:04 +00:00			`sampling_rate = hps.data.sampling_rate`
			`hop_length = hps.data.hop_length`
Debug 2023-05-14 07:22:20 +00:00			`speech_encoder = hps["model"]["speech_encoder"]`
upload code 2023-03-10 10:11:04 +00:00
diff 2023-05-16 05:17:51 +00:00
Update preprocess_hubert_f0.py 2023-07-22 13:36:27 +00:00			`def process_one(filename, hmodel,f0p,rank,diff=False,mel_extractor=None):`
upload code 2023-03-10 10:11:04 +00:00			`wav, sr = librosa.load(filename, sr=sampling_rate)`
diff 2023-05-16 05:17:51 +00:00			`audio_norm = torch.FloatTensor(wav)`
			`audio_norm = audio_norm.unsqueeze(0)`
Update preprocess_hubert_f0.py 2023-07-22 13:34:11 +00:00			`device = torch.device(f"cuda:{rank}")`
upload code 2023-03-10 10:11:04 +00:00			`soft_path = filename + ".soft.pt"`
			`if not os.path.exists(soft_path):`
			`wav16k = librosa.resample(wav, orig_sr=sampling_rate, target_sr=16000)`
Correct typos in preprocess_hubert_f0.py 2023-03-16 23:10:47 +00:00			`wav16k = torch.from_numpy(wav16k).to(device)`
Updata Encoder class 2023-05-14 06:39:07 +00:00			`c = hmodel.encoder(wav16k)`
upload code 2023-03-10 10:11:04 +00:00			`torch.save(c.cpu(), soft_path)`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00
upload code 2023-03-10 10:11:04 +00:00			`f0_path = filename + ".f0.npy"`
			`if not os.path.exists(f0_path):`
Updata Encoder class 2023-05-14 06:39:07 +00:00			`f0_predictor = utils.get_f0_predictor(f0p,sampling_rate=sampling_rate, hop_length=hop_length,device=None,threshold=0.05)`
Encoder OOP 2023-05-13 15:45:56 +00:00			`f0,uv = f0_predictor.compute_f0_uv(`
Updata F0 Predictor 2023-05-13 07:33:40 +00:00			`wav`
remove redundent spec_gen and fix related bug 2023-03-24 05:00:14 +00:00			`)`
Encoder OOP 2023-05-13 15:45:56 +00:00			`np.save(f0_path, np.asanyarray((f0,uv),dtype=object))`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00

remove redundent spec_gen and fix related bug 2023-03-24 05:00:14 +00:00			`spec_path = filename.replace(".wav", ".spec.pt")`
			`if not os.path.exists(spec_path):`
			`# Process spectrogram`
			`# The following code can't be replaced by torch.FloatTensor(wav)`
			`# because load_wav_to_torch return a tensor that need to be normalized`

			`if sr != hps.data.sampling_rate:`
			`raise ValueError(`
			`"{} SR doesn't match target {} SR".format(`
			`sr, hps.data.sampling_rate`
			`)`
			`)`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00
diff 2023-05-16 05:17:51 +00:00			`#audio_norm = audio / hps.data.max_wav_value`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00
remove redundent spec_gen and fix related bug 2023-03-24 05:00:14 +00:00			`spec = spectrogram_torch(`
			`audio_norm,`
			`hps.data.filter_length,`
			`hps.data.sampling_rate,`
			`hps.data.hop_length,`
			`hps.data.win_length,`
			`center=False,`
			`)`
			`spec = torch.squeeze(spec, 0)`
			`torch.save(spec, spec_path)`

Updata vol emb 2023-05-28 13:47:32 +00:00			`if diff or hps.model.vol_embedding:`
diff 2023-05-16 05:17:51 +00:00			`volume_path = filename + ".vol.npy"`
			`volume_extractor = utils.Volume_Extractor(hop_length)`
			`if not os.path.exists(volume_path):`
			`volume = volume_extractor.extract(audio_norm)`
			`np.save(volume_path, volume.to('cpu').numpy())`
Updata vol emb 2023-05-28 13:47:32 +00:00
			`if diff:`
diff 2023-05-16 05:17:51 +00:00			`mel_path = filename + ".mel.npy"`
			`if not os.path.exists(mel_path) and mel_extractor is not None:`
			`mel_t = mel_extractor.extract(audio_norm.to(device), sampling_rate)`
			`mel = mel_t.squeeze().to('cpu').numpy()`
			`np.save(mel_path, mel)`
			`aug_mel_path = filename + ".aug_mel.npy"`
			`aug_vol_path = filename + ".aug_vol.npy"`
			`max_amp = float(torch.max(torch.abs(audio_norm))) + 1e-5`
			`max_shift = min(1, np.log10(1/max_amp))`
			`log10_vol_shift = random.uniform(-1, max_shift)`
			`keyshift = random.uniform(-5, 5)`
			`if mel_extractor is not None:`
			`aug_mel_t = mel_extractor.extract(audio_norm * (10 ** log10_vol_shift), sampling_rate, keyshift = keyshift)`
			`aug_mel = aug_mel_t.squeeze().to('cpu').numpy()`
			`aug_vol = volume_extractor.extract(audio_norm * (10 ** log10_vol_shift))`
			`if not os.path.exists(aug_mel_path):`
			`np.save(aug_mel_path,np.asanyarray((aug_mel,keyshift),dtype=object))`
			`if not os.path.exists(aug_vol_path):`
			`np.save(aug_vol_path,aug_vol.to('cpu').numpy())`

fix(preprocess): pass device 2023-07-23 14:12:04 +00:00
			`def process_batch(file_chunk, f0p, diff=False, mel_extractor=None, device="cpu"):`
Update preprocess_hubert_f0.py 2023-07-22 14:01:44 +00:00			`logger.info("Loading speech encoder for content...")`
Update preprocess_hubert_f0.py 2023-07-22 06:30:54 +00:00			`rank = mp.current_process()._identity`
			`rank = rank[0] if len(rank) > 0 else 0`
			`if torch.cuda.is_available():`
			`gpu_id = rank % torch.cuda.device_count()`
			`device = torch.device(f"cuda:{gpu_id}")`
Update preprocess_hubert_f0.py 2023-07-22 14:01:44 +00:00			`logger.info(f"Rank {rank} uses device {device}")`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`hmodel = utils.get_speech_encoder(speech_encoder, device=device)`
Update preprocess_hubert_f0.py 2023-07-22 14:01:44 +00:00			`logger.info(f"Loaded speech encoder for rank {rank}")`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`for filename in tqdm(file_chunk):`
Debug rank GPU 2023-07-23 01:43:00 +00:00			`process_one(filename, hmodel, f0p, gpu_id, diff, mel_extractor)`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00
fix(preprocess): pass device 2023-07-23 14:12:04 +00:00			`def parallel_process(filenames, num_processes, f0p, diff, mel_extractor, device):`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`with ProcessPoolExecutor(max_workers=num_processes) as executor:`
			`tasks = []`
			`for i in range(num_processes):`
			`start = int(i * len(filenames) / num_processes)`
			`end = int((i + 1) * len(filenames) / num_processes)`
			`file_chunk = filenames[start:end]`
fix(preprocess): pass device 2023-07-23 14:12:04 +00:00			`tasks.append(executor.submit(process_batch, file_chunk, f0p, diff, mel_extractor, device=device))`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`for task in tqdm(tasks):`
			`task.result()`
upload code 2023-03-10 10:11:04 +00:00
			`if __name__ == "__main__":`
			`parser = argparse.ArgumentParser()`
fix(preprocess): pass device 2023-07-23 14:12:04 +00:00			`parser.add_argument('-d', '--device', type=str, default=None)`
remove redundent spec_gen and fix related bug 2023-03-24 05:00:14 +00:00			`parser.add_argument(`
			`"--in_dir", type=str, default="dataset/44k", help="path to input dir"`
			`)`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`parser.add_argument(`
diff 2023-05-16 05:17:51 +00:00			`'--use_diff',action='store_true', help='Whether to use the diffusion model'`
Updata Encoder class 2023-05-14 06:39:07 +00:00			`)`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`parser.add_argument(`
Updata FCPE 2023-07-22 16:25:03 +00:00			`'--f0_predictor', type=str, default="dio", help='Select F0 predictor, can select crepe,pm,dio,harvest,rmvpe,fcpe|default: pm(note: crepe is original F0 using mean filter)'`
difi 2023-05-14 17:23:46 +00:00			`)`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`parser.add_argument(`
Updata Preprocess multiprocessing/thread 2023-05-30 18:12:46 +00:00			`'--num_processes', type=int, default=1, help='You are advised to set the number of processes to the same as the number of CPU cores'`
			`)`
upload code 2023-03-10 10:11:04 +00:00			`args = parser.parse_args()`
Updata Encoder class 2023-05-14 06:39:07 +00:00			`f0p = args.f0_predictor`
fix(preprocess): pass device 2023-07-23 14:12:04 +00:00			`device = args.device`
			`if device is None:`
			`device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")`

Updata Encoder class 2023-05-14 06:39:07 +00:00			`print(speech_encoder)`
Merge branch '4.1-Stable' into 4.1-Latest 2023-07-23 15:05:02 +00:00			`logger.info("Using device: ", device)`
			`logger.info("Using SpeechEncoder: " + speech_encoder)`
			`logger.info("Using extractor: " + f0p)`
			`logger.info("Using diff Mode: " + str( args.use_diff))`

diff 2023-05-16 05:17:51 +00:00			`if args.use_diff:`
			`print("use_diff")`
			`print("Loading Mel Extractor...")`
fix(preprocess): pass device 2023-07-23 14:12:04 +00:00			`mel_extractor = Vocoder(dconfig.vocoder.type, dconfig.vocoder.ckpt, device=device)`
diff 2023-05-16 05:17:51 +00:00			`print("Loaded Mel Extractor.")`
			`else:`
			`mel_extractor = None`
remove redundent spec_gen and fix related bug 2023-03-24 05:00:14 +00:00			`filenames = glob(f"{args.in_dir}/*/*.wav", recursive=True) # [:10]`
upload code 2023-03-10 10:11:04 +00:00			`shuffle(filenames)`
Update preprocess_hubert_f0.py 2023-07-22 06:30:54 +00:00			`mp.set_start_method("spawn", force=True)`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00
Updata Preprocess multiprocessing/thread 2023-05-30 18:12:46 +00:00			`num_processes = args.num_processes`
并行执行预处理，处理速度或将提升，整理部分代码 (#230) * 使用多线程来进行预处理，速度或将大幅提升，使用方法为 --use_thread <线程数> * 并行执行预处理，处理速度或将提升，整理部分代码 * 修正kl_loss计算公式 * resample使用多进程，preprocess_hubert_f0使用旧的并行方式（尝试共享模型失败） 2023-06-19 19:38:13 +00:00			`if num_processes == 0:`
			`num_processes = os.cpu_count()`
fix(preprocess): pass device 2023-07-23 14:12:04 +00:00
			`parallel_process(filenames, num_processes, f0p, args.use_diff, mel_extractor, device)`