1 min voice data can also be used to train a good TTS model! (few shot voice cloning)
273 matches across 14 categories. Click a row to expand file-level details.
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | webui.py | 167 | def check_pretrained_is_exist(version): |
| LOW | api.py | 494 | def change_gpt_sovits_weights(gpt_path, sovits_path): |
| LOW | tools/uvr5/lib/lib_v5/spec_utils.py | 139 | def reduce_vocal_aggressively(X, y, softmask): |
| LOW | GPT_SoVITS/process_ckpt.py | 100 | def get_sovits_version_from_path_fast(sovits_path): |
| LOW | GPT_SoVITS/inference_webui.py | 751 | def merge_short_text_in_array(texts, threshold): |
| LOW | GPT_SoVITS/export_torch_script.py | 107 | def multinomial_sample_one_no_sync(probs_sort): |
| LOW | GPT_SoVITS/export_torch_script.py | 554 | def build_phone_level_feature(res: Tensor, word2ph: IntTensor): |
| LOW | GPT_SoVITS/utils.py | 120 | def plot_spectrogram_to_numpy(spectrogram): |
| LOW | GPT_SoVITS/stream_v2pro.py | 188 | def find_best_audio_offset_fast(reference_audio: Tensor, search_audio: Tensor): |
| LOW | GPT_SoVITS/eres2net/kaldi.py | 125 | def _get_waveform_and_window_properties( |
| LOW | GPT_SoVITS/module/mel_processing.py | 8 | def dynamic_range_compression_torch(x, C=1, clip_val=1e-5): |
| LOW | GPT_SoVITS/module/mel_processing.py | 17 | def dynamic_range_decompression_torch(x, C=1): |
| LOW | GPT_SoVITS/module/mel_processing.py | 31 | def spectral_de_normalize_torch(magnitudes): |
| LOW | GPT_SoVITS/module/transforms.py | 12 | def piecewise_rational_quadratic_transform( |
| LOW | GPT_SoVITS/module/transforms.py | 50 | def unconstrained_rational_quadratic_spline( |
| LOW | GPT_SoVITS/module/transforms.py | 100 | def rational_quadratic_spline( |
| LOW | GPT_SoVITS/module/mrte_model.py | 158 | def fused_add_tanh_sigmoid_multiply(input, n_channels): |
| LOW | GPT_SoVITS/module/attentions.py | 260 | def _matmul_with_relative_values(self, x, y): |
| LOW | GPT_SoVITS/module/attentions.py | 269 | def _matmul_with_relative_keys(self, x, y): |
| LOW | GPT_SoVITS/module/attentions.py | 294 | def _relative_position_to_absolute_position(self, x): |
| LOW | GPT_SoVITS/module/attentions.py | 311 | def _absolute_position_to_relative_position(self, x): |
| LOW | GPT_SoVITS/module/attentions.py | 507 | def remove_weight_norm_modules(module, name="weight"): |
| LOW | GPT_SoVITS/module/data_utils.py | 109 | def get_audio_text_speaker_pair(self, audiopath_sid_text): |
| LOW | GPT_SoVITS/module/data_utils.py | 375 | def get_audio_text_speaker_pair(self, audiopath_sid_text): |
| LOW | GPT_SoVITS/module/data_utils.py | 613 | def get_audio_text_speaker_pair(self, audiopath_sid_text): |
| LOW | GPT_SoVITS/module/data_utils.py | 824 | def get_audio_text_speaker_pair(self, audiopath_sid_text): |
| LOW | GPT_SoVITS/module/commons.py | 97 | def fused_add_tanh_sigmoid_multiply(input_a, input_b, n_channels): |
| LOW | GPT_SoVITS/module/attentions_onnx.py | 27 | def fused_add_tanh_sigmoid_multiply(input_a, input_b, n_channels): |
| LOW | GPT_SoVITS/module/attentions_onnx.py | 223 | def _matmul_with_relative_values(self, x, y): |
| LOW | GPT_SoVITS/module/attentions_onnx.py | 232 | def _matmul_with_relative_keys(self, x, y): |
| LOW | GPT_SoVITS/module/attentions_onnx.py | 257 | def _relative_position_to_absolute_position(self, x): |
| LOW | GPT_SoVITS/module/attentions_onnx.py | 274 | def _absolute_position_to_relative_position(self, x): |
| LOW | GPT_SoVITS/TTS_infer_pack/TTS.py | 1665 | def using_vocoder_synthesis_batched_infer( |
| LOW | GPT_SoVITS/TTS_infer_pack/TextPreprocessor.py | 34 | def merge_short_text_in_array(texts: str, threshold: int) -> list: |
| LOW | GPT_SoVITS/TTS_infer_pack/TextPreprocessor.py | 117 | def segment_and_extract_feature_for_text( |
| LOW | GPT_SoVITS/TTS_infer_pack/TextPreprocessor.py | 235 | def replace_consecutive_punctuation(self, text): |
| LOW | GPT_SoVITS/BigVGAN/meldataset.py | 23 | def dynamic_range_compression(x, C=1, clip_val=1e-5): |
| LOW | GPT_SoVITS/BigVGAN/meldataset.py | 27 | def dynamic_range_decompression(x, C=1): |
| LOW | GPT_SoVITS/BigVGAN/meldataset.py | 31 | def dynamic_range_compression_torch(x, C=1, clip_val=1e-5): |
| LOW | GPT_SoVITS/BigVGAN/meldataset.py | 35 | def dynamic_range_decompression_torch(x, C=1): |
| LOW | GPT_SoVITS/BigVGAN/meldataset.py | 43 | def spectral_de_normalize_torch(magnitudes): |
| LOW | GPT_SoVITS/BigVGAN/alias_free_activation/cuda/load.py | 31 | def _cpp_extention_load_helper(name, sources, extra_cuda_flags): |
| LOW | GPT_SoVITS/BigVGAN/alias_free_activation/cuda/load.py | 66 | def _get_cuda_bare_metal_version(cuda_dir): |
| LOW | GPT_SoVITS/BigVGAN/tests/test_activation.py | 24 | def test_anti_alias_activation(): |
| LOW | GPT_SoVITS/BigVGAN/tests/test_activation_snake_beta.py | 24 | def test_anti_alias_activation(): |
| LOW | GPT_SoVITS/f5_tts/model/modules.py | 30 | def get_bigvgan_mel_spectrogram( |
| LOW | GPT_SoVITS/f5_tts/model/modules.py | 75 | def get_vocos_mel_spectrogram( |
| LOW | GPT_SoVITS/AR/models/t2s_model_onnx.py | 74 | def multinomial_sample_one_no_sync( |
| LOW | GPT_SoVITS/AR/models/utils.py | 140 | def multinomial_sample_one_no_sync( |
| LOW | GPT_SoVITS/AR/models/t2s_model.py | 39 | def scaled_dot_product_attention( |
| LOW | GPT_SoVITS/AR/models/t2s_model.py | 783 | def infer_panel_naive_batched( |
| LOW | GPT_SoVITS/AR/modules/patched_mha_with_cache_onnx.py | 7 | def multi_head_attention_forward_patched( |
| LOW | GPT_SoVITS/AR/modules/patched_mha_with_cache.py | 13 | def multi_head_attention_forward_patched( |
| LOW | GPT_SoVITS/AR/modules/optim.py | 363 | def _show_gradient_dominating_parameter(self, tuples: List[Tuple[Tensor, dict, List[str]]], tot_sumsq: Tensor): |
| LOW | GPT_SoVITS/text/chinese2.py | 305 | def replace_punctuation_with_en(text): |
| LOW | GPT_SoVITS/text/chinese2.py | 316 | def replace_consecutive_punctuation(text): |
| LOW | GPT_SoVITS/text/cantonese.py | 118 | def jyuping_to_initials_finals_tones(jyuping_syllables): |
| LOW | GPT_SoVITS/text/japanese.py | 138 | def replace_consecutive_punctuation(text): |
| LOW | GPT_SoVITS/text/japanese.py | 260 | def _numeric_feature_by_regex(regex, s): |
| LOW | GPT_SoVITS/text/english.py | 124 | def replace_consecutive_punctuation(text): |
| 10 more matches not shown… | | | |
| Severity | File | Line | Snippet |
|---|---|---|---|
| HIGH | GPT_SoVITS/module/data_utils.py | 0 | 1) loads audio, speaker_id, text pairs 2) normalizes text and converts them to sequences of integers 3) computes spectro |
| HIGH | GPT_SoVITS/module/data_utils.py | 0 | 1) loads audio, speaker_id, text pairs 2) normalizes text and converts them to sequences of integers 3) computes spectro |
| HIGH | GPT_SoVITS/module/data_utils.py | 0 | 1) loads audio, speaker_id, text pairs 2) normalizes text and converts them to sequences of integers 3) computes spectro |
| HIGH | GPT_SoVITS/module/data_utils.py | 0 | 1) loads audio, speaker_id, text pairs 2) normalizes text and converts them to sequences of integers 3) computes spectro |
| HIGH | GPT_SoVITS/module/data_utils.py | 0 | collate's training batch from normalized text, audio and speaker identities params ------ batch: [text_normalized, spec_ |
| HIGH | GPT_SoVITS/module/data_utils.py | 0 | collate's training batch from normalized text, audio and speaker identities params ------ batch: [text_normalized, spec_ |
| HIGH | GPT_SoVITS/module/data_utils.py | 0 | collate's training batch from normalized text, audio and speaker identities params ------ batch: [text_normalized, spec_ |
| HIGH | GPT_SoVITS/module/data_utils.py | 0 | collate's training batch from normalized text, audio and speaker identities params ------ batch: [text_normalized, spec_ |
| HIGH | GPT_SoVITS/f5_tts/model/modules.py | 0 | ein notation: b - batch n - sequence nt - text sequence nw - raw wave length d - dimension |
| HIGH | GPT_SoVITS/f5_tts/model/backbones/mmdit.py | 0 | ein notation: b - batch n - sequence nt - text sequence nw - raw wave length d - dimension |
| HIGH | GPT_SoVITS/f5_tts/model/backbones/unett.py | 0 | ein notation: b - batch n - sequence nt - text sequence nw - raw wave length d - dimension |
| HIGH | GPT_SoVITS/f5_tts/model/backbones/dit.py | 0 | ein notation: b - batch n - sequence nt - text sequence nw - raw wave length d - dimension |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | api_v2.py | 345 | |
| LOW | webui.py | 244 | |
| LOW | webui.py | 1046 | |
| LOW | api.py | 545 | |
| LOW | api.py | 830 | |
| LOW | tools/slicer2.py | 67 | |
| LOW | tools/slice_audio.py | 13 | |
| LOW | tools/my_utils.py | 49 | |
| LOW | tools/my_utils.py | 140 | |
| LOW | tools/my_utils.py | 187 | |
| LOW | tools/uvr5/webui.py | 45 | |
| LOW | tools/uvr5/vr.py | 45 | |
| LOW | tools/uvr5/vr.py | 217 | |
| LOW | tools/uvr5/mdxnet.py | 172 | |
| LOW | tools/uvr5/bsroformer.py | 111 | |
| LOW | tools/uvr5/lib/utils.py | 94 | |
| LOW | tools/asr/fasterwhisper_asr.py | 104 | |
| LOW | tools/i18n/scan_i18n.py | 29 | |
| LOW | GPT_SoVITS/s1_train.py | 46 | |
| LOW | GPT_SoVITS/inference_webui.py | 640 | |
| LOW | GPT_SoVITS/inference_webui.py | 790 | |
| LOW | GPT_SoVITS/s2_train_v3_lora.py | 263 | |
| LOW | GPT_SoVITS/s2_train.py | 318 | |
| LOW | GPT_SoVITS/stream_v2pro.py | 240 | |
| LOW | GPT_SoVITS/eres2net/kaldi.py | 86 | |
| LOW | GPT_SoVITS/module/mrte_model.py | 25 | |
| LOW | GPT_SoVITS/module/ddp_utils.py | 58 | |
| LOW | GPT_SoVITS/TTS_infer_pack/TTS.py | 856 | |
| LOW | GPT_SoVITS/TTS_infer_pack/TTS.py | 998 | |
| LOW | GPT_SoVITS/TTS_infer_pack/TextPreprocessor.py | 122 | |
| LOW | GPT_SoVITS/BigVGAN/train.py | 56 | |
| LOW | GPT_SoVITS/BigVGAN/train.py | 265 | |
| LOW | GPT_SoVITS/BigVGAN/meldataset.py | 222 | |
| LOW | GPT_SoVITS/f5_tts/model/backbones/unett.py | 164 | |
| LOW | GPT_SoVITS/AR/utils/initialize.py | 8 | |
| LOW | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 458 | |
| LOW | GPT_SoVITS/AR/models/t2s_model.py | 583 | |
| LOW | GPT_SoVITS/AR/modules/patched_mha_with_cache.py | 13 | |
| LOW | GPT_SoVITS/AR/modules/activation.py | 204 | |
| LOW | GPT_SoVITS/AR/modules/optim.py | 197 | |
| LOW | GPT_SoVITS/text/chinese2.py | 180 | |
| LOW | GPT_SoVITS/text/cantonese.py | 118 | |
| LOW | GPT_SoVITS/text/cantonese.py | 176 | |
| LOW | GPT_SoVITS/text/japanese.py | 183 | |
| LOW | GPT_SoVITS/text/english.py | 131 | |
| LOW | GPT_SoVITS/text/english.py | 155 | |
| LOW | GPT_SoVITS/text/english.py | 270 | |
| LOW | GPT_SoVITS/text/english.py | 309 | |
| LOW | GPT_SoVITS/text/tone_sandhi.py | 495 | |
| LOW | GPT_SoVITS/text/tone_sandhi.py | 550 | |
| LOW | GPT_SoVITS/text/tone_sandhi.py | 586 | |
| LOW | GPT_SoVITS/text/chinese.py | 94 | |
| LOW | GPT_SoVITS/text/korean.py | 183 | |
| LOW | GPT_SoVITS/text/korean.py | 15 | |
| LOW | GPT_SoVITS/text/en_normalization/expend.py | 226 | |
| LOW | GPT_SoVITS/text/g2pw/onnx_api.py | 74 | |
| LOW | GPT_SoVITS/text/g2pw/onnx_api.py | 248 | |
| LOW | GPT_SoVITS/text/g2pw/utils.py | 132 | |
| LOW | GPT_SoVITS/text/LangSegmenter/langsegmenter.py | 90 | |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | api_v2.py | 444 | except Exception as e: |
| LOW | api_v2.py | 521 | except Exception as e: |
| LOW | api_v2.py | 551 | except Exception as e: |
| LOW | api_v2.py | 563 | except Exception as e: |
| LOW | api_v2.py | 573 | except Exception: |
| LOW | webui.py | 32 | except Exception as e: |
| LOW | api.py | 498 | except Exception as e: |
| LOW | api.py | 901 | except Exception as e: |
| MEDIUM | api.py | 494 | def change_gpt_sovits_weights(gpt_path, sovits_path): |
| LOW | tools/my_utils.py | 29 | except Exception: |
| MEDIUM | tools/my_utils.py | 16 | def load_audio(file, sr): |
| MEDIUM | tools/uvr5/bsroformer.py | 107 | print("Error: Unknown model: {}".format(self.model_type)) |
| LOW | tools/uvr5/bsroformer.py | 212 | except Exception as e: |
| MEDIUM | tools/uvr5/bsroformer.py | 214 | print("Error message: {}".format(str(e))) |
| LOW | tools/asr/funasr_asr.py | 18 | except Exception: |
| LOW | tools/asr/funasr_asr.py | 87 | except Exception: |
| MEDIUM | tools/asr/funasr_asr.py | 14 | def only_asr(input_file, language): |
| LOW | tools/asr/fasterwhisper_asr.py | 47 | except Exception: |
| LOW | tools/asr/fasterwhisper_asr.py | 137 | except Exception as e: |
| LOW | tools/i18n/scan_i18n.py | 48 | except Exception as e: |
| LOW | GPT_SoVITS/s1_train.py | 144 | except Exception: |
| LOW | GPT_SoVITS/inference_webui.py | 165 | except Exception as e: |
| LOW | GPT_SoVITS/module/data_utils.py | 83 | except Exception: |
| LOW | GPT_SoVITS/module/data_utils.py | 337 | except Exception: |
| LOW | GPT_SoVITS/module/data_utils.py | 575 | except Exception: |
| LOW | GPT_SoVITS/module/data_utils.py | 786 | except Exception: |
| LOW | GPT_SoVITS/TTS_infer_pack/TTS.py | 1516 | except Exception as e: |
| MEDIUM | GPT_SoVITS/TTS_infer_pack/TTS.py | 126 | def __getattr__(self, item): |
| LOW | GPT_SoVITS/BigVGAN/meldataset.py | 362 | except Exception as e: |
| LOW | GPT_SoVITS/AR/utils/__init__.py | 34 | except Exception: |
| MEDIUM | GPT_SoVITS/AR/utils/__init__.py | 28 | def check_txt_file(file_path): |
| LOW | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 584 | except Exception as e: |
| LOW | GPT_SoVITS/AR/data/dataset.py | 134 | except Exception: |
| LOW | GPT_SoVITS/text/japanese.py | 72 | except Exception: |
| LOW | GPT_SoVITS/text/g2pw/onnx_api.py | 24 | except Exception: |
| LOW | GPT_SoVITS/text/g2pw/dataset.py | 75 | except Exception: |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | api_v2.py | 181 | def pack_ogg(io_buffer: BytesIO, data: np.ndarray, rate: int): |
| LOW | api_v2.py | 521 | except Exception as e: |
| LOW | api.py | 681 | |
| LOW | GPT_SoVITS/inference_webui.py | 1401 | sample_steps, |
| LOW | GPT_SoVITS/export_torch_script_v3v4.py | 681 | estimator: ExportDiT = torch.jit.trace( |
| LOW | GPT_SoVITS/export_torch_script_v3v4.py | 881 | ) |
| LOW | GPT_SoVITS/export_torch_script_v3v4.py | 1161 | # vq_model = torch.jit.optimize_for_inference(vq_model) |
| LOW | GPT_SoVITS/export_torch_script.py | 941 | # bert_model = AutoModelForMaskedLM.from_pretrained(bert_path,output_hidden_states=True,torchscript=True) |
| LOW | GPT_SoVITS/s2_train_v3.py | 161 | ) |
| LOW | GPT_SoVITS/s2_train_v3.py | 221 | # torch.load(hps.train.pretrained_s2D, map_location="cpu")["weight"] |
| LOW | GPT_SoVITS/s2_train_v3.py | 381 | # "slice/mel_gen": utils.plot_spectrogram_to_numpy(y_hat_mel[0].data.cpu().numpy()), |
| LOW | GPT_SoVITS/module/attentions_onnx.py | 101 | # x = x * x_mask |
| LOW | GPT_SoVITS/module/core_vq.py | 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. |
| LOW | GPT_SoVITS/TTS_infer_pack/TTS.py | 281 | "v2Pro": 486, |
| LOW | GPT_SoVITS/TTS_infer_pack/TTS.py | 941 | # phones_batch = self.batch_sequences(phones_list, axis=0, pad_value=0, max_length=max_len) |
| LOW | GPT_SoVITS/TTS_infer_pack/TTS.py | 1281 | t4 = time.perf_counter() |
| LOW | GPT_SoVITS/BigVGAN/alias_free_activation/cuda/compat.h | 21 | #ifndef TORCH_CHECK |
| LOW | GPT_SoVITS/f5_tts/model/__init__.py | 1 | # from f5_tts.model.cfm import CFM |
| LOW | GPT_SoVITS/AR/models/t2s_lightning_module.py | 81 | ) |
| LOW | GPT_SoVITS/AR/models/t2s_lightning_module.py | 101 | # f"val_top_{self.top_k}_acc", |
| LOW | GPT_SoVITS/AR/models/t2s_model.py | 661 | value=False, |
| LOW | GPT_SoVITS/AR/models/t2s_model.py | 681 | |
| LOW | GPT_SoVITS/AR/modules/scaling.py | 1 | # Copyright 2022 Xiaomi Corp. (authors: Daniel Povey) |
| LOW | GPT_SoVITS/AR/modules/optim.py | 1 | # Copyright 2022 Xiaomi Corp. (authors: Daniel Povey) |
| LOW | GPT_SoVITS/AR/data/dataset.py | 321 | # print('batch["phoneme_ids_len"]:', batch["phoneme_ids_len"], |
| LOW | GPT_SoVITS/text/tone_sandhi.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/korean.py | 61 | # This is a list of Korean classifiers preceded by pure Korean numerals. |
| LOW | GPT_SoVITS/text/g2pw/dataset.py | 1 | # Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/g2pw/utils.py | 1 | # Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/zh_normalization/num.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/zh_normalization/constants.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/zh_normalization/__init__.py | 1 | # Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/zh_normalization/char_convert.py | 1 | # coding=utf-8 |
| LOW | GPT_SoVITS/text/zh_normalization/chronology.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/zh_normalization/phonecode.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/zh_normalization/text_normlization.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/text/zh_normalization/quantifier.py | 1 | # Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. |
| LOW | GPT_SoVITS/feature_extractor/cnhubert.py | 41 | # def __init__(self): |
| LOW | GPT_SoVITS/feature_extractor/cnhubert.py | 61 | # def __init__(self): |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | api.py | 542 | |
| LOW | tools/audio_sr.py | 1 | |
| LOW | tools/audio_sr.py | 1 | |
| LOW | tools/audio_sr.py | 1 | |
| LOW | tools/audio_sr.py | 1 | |
| LOW | GPT_SoVITS/inference_webui.py | 637 | |
| LOW | GPT_SoVITS/module/core_vq.py | 36 | |
| LOW | GPT_SoVITS/TTS_infer_pack/__init__.py | 1 | |
| LOW | GPT_SoVITS/TTS_infer_pack/__init__.py | 1 | |
| LOW | GPT_SoVITS/TTS_infer_pack/TextPreprocessor.py | 13 | |
| LOW | GPT_SoVITS/BigVGAN/inference_e2e.py | 4 | |
| LOW | GPT_SoVITS/BigVGAN/inference_e2e.py | 4 | |
| LOW | GPT_SoVITS/BigVGAN/inference_e2e.py | 4 | |
| LOW | GPT_SoVITS/BigVGAN/inference_e2e.py | 4 | |
| LOW | GPT_SoVITS/BigVGAN/inference.py | 4 | |
| LOW | GPT_SoVITS/BigVGAN/inference.py | 4 | |
| LOW | GPT_SoVITS/BigVGAN/inference.py | 4 | |
| LOW | GPT_SoVITS/BigVGAN/inference.py | 4 | |
| LOW | …SoVITS/BigVGAN/alias_free_activation/torch/__init__.py | 4 | |
| LOW | …SoVITS/BigVGAN/alias_free_activation/torch/__init__.py | 5 | |
| LOW | …SoVITS/BigVGAN/alias_free_activation/torch/__init__.py | 6 | |
| LOW | GPT_SoVITS/f5_tts/model/__init__.py | 4 | |
| LOW | GPT_SoVITS/f5_tts/model/modules.py | 10 | |
| LOW | GPT_SoVITS/f5_tts/model/backbones/mmdit.py | 10 | |
| LOW | GPT_SoVITS/f5_tts/model/backbones/unett.py | 10 | |
| LOW | GPT_SoVITS/f5_tts/model/backbones/dit.py | 10 | |
| LOW | GPT_SoVITS/AR/models/structs_cudagraph.py | 1 | |
| LOW | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 7 | |
| LOW | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 9 | |
| LOW | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 12 | |
| LOW | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 12 | |
| LOW | GPT_SoVITS/AR/modules/patched_mha_with_cache_onnx.py | 1 | |
| LOW | GPT_SoVITS/AR/modules/patched_mha_with_cache.py | 1 | |
| LOW | GPT_SoVITS/text/en_normalization/expend.py | 3 | |
| LOW | GPT_SoVITS/text/g2pw/__init__.py | 1 | |
| LOW | GPT_SoVITS/text/LangSegmenter/__init__.py | 1 | |
| LOW | GPT_SoVITS/text/zh_normalization/__init__.py | 14 | |
| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | api.py | 1155 | # -------------------------------- |
| MEDIUM | api.py | 1157 | # -------------------------------- |
| MEDIUM | api.py | 1295 | # -------------------------------- |
| MEDIUM | api.py | 1297 | # -------------------------------- |
| MEDIUM | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 74 | # ─── KV Cache ──────────────────────────────────────────────────────────────── |
| MEDIUM | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 117 | # ─── Attention (PyTorch native SDPA, no flash_attn) ───────────────────────── |
| MEDIUM | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 185 | # ─── Feed Forward ──────────────────────────────────────────────────────────── |
| MEDIUM | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 201 | # ─── Transformer Block ────────────────────────────────────────────────────── |
| MEDIUM | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 243 | # ─── Transformer Decoder ──────────────────────────────────────────────────── |
| MEDIUM | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 291 | # ─── T2S Decoder ───────────────────────────────────────────────────────────── |
| MEDIUM | GPT_SoVITS/AR/models/t2s_model_cudagraph.py | 433 | # ─── CUDA Graph Runner ─────────────────────────────────────────────────────── |
| Severity | File | Line | Snippet |
|---|---|---|---|
| HIGH | tools/assets.py | 7 | const newUrl = `${window.location.pathname}?${params.toString()}`; |
| Severity | File | Line | Snippet |
|---|---|---|---|
| HIGH | GPT_SoVITS/text/japanese.py | 184 | Extract phoneme + prosoody symbol sequence from input full-context labels. The algorithm is based on `Prosodic feat |
| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | tools/slicer2.py | 4 | # This function is obtained from librosa. |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | GPT_SoVITS/BigVGAN/alias_free_activation/cuda/load.py | 18 | # Check if cuda 11 is installed for compute capability 8.0 |
| LOW | GPT_SoVITS/BigVGAN/tests/test_cuda_vs_torch_model.py | 175 | # Print results |
| Severity | File | Line | Snippet |
|---|---|---|---|
| MEDIUM | …ITS/BigVGAN/alias_free_activation/cuda/activation1d.py | 30 | |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | GPT_SoVITS/AR/modules/optim.py | 462 | # For parameters with 1 element we just use regular Adam. |
| Severity | File | Line | Snippet |
|---|---|---|---|
| LOW | GPT_SoVITS/AR/modules/activation.py | 274 | # When lifting this restriction, don't forget to either |
| LOW | GPT_SoVITS/AR/modules/activation.py | 274 | # When lifting this restriction, don't forget to either |