wetdog committed on
Commit
9dc5ce7
1 Parent(s): bea1338

add vocos config to hub

Browse files
Files changed (3) hide show
  1. Dockerfile +2 -0
  2. config_22khz.yaml +0 -24
  3. infer_onnx.py +1 -1
Dockerfile CHANGED
@@ -44,6 +44,8 @@ RUN huggingface-cli download BSC-LT/matcha-tts-cat-onnx matcha_multispeaker_cat_
44
 
45
  RUN huggingface-cli download BSC-LT/vocos-mel-22khz-onnx mel_spec_22khz_v2.onnx --local-dir $HOME/app/
46
 
 
 
47
  COPY --chown=user . $HOME/app/
48
 
49
  # Fix ownership issues
 
44
 
45
  RUN huggingface-cli download BSC-LT/vocos-mel-22khz-onnx mel_spec_22khz_v2.onnx --local-dir $HOME/app/
46
 
47
+ RUN huggingface-cli download BSC-LT/vocos-mel-22khz-onnx config.yaml --local-dir $HOME/app/
48
+
49
  COPY --chown=user . $HOME/app/
50
 
51
  # Fix ownership issues
config_22khz.yaml DELETED
@@ -1,24 +0,0 @@
1
- feature_extractor:
2
- class_path: vocos.feature_extractors.MelSpectrogramFeatures
3
- init_args:
4
- sample_rate: 22050
5
- n_fft: 1024
6
- hop_length: 256
7
- n_mels: 80
8
- padding: center
9
-
10
- backbone:
11
- class_path: vocos.models.VocosBackbone
12
- init_args:
13
- input_channels: 80
14
- dim: 512
15
- intermediate_dim: 1536
16
- num_layers: 8
17
-
18
- head:
19
- class_path: vocos.heads.ISTFTHead
20
- init_args:
21
- dim: 512
22
- n_fft: 1024
23
- hop_length: 256
24
- padding: center
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
infer_onnx.py CHANGED
@@ -33,7 +33,7 @@ def process_text(i: int, text: str, device: torch.device):
33
  MODEL_PATH_MATCHA_MEL="matcha_multispeaker_cat_opset_15_10_steps_lastwords.onnx"
34
  MODEL_PATH_MATCHA="matcha_hifigan_multispeaker_cat.onnx"
35
  MODEL_PATH_VOCOS="mel_spec_22khz_v2.onnx"
36
- CONFIG_PATH="config_22khz.yaml"
37
  SPEAKER_ID_DICT="spk_to_id.json"
38
 
39
  sess_options = onnxruntime.SessionOptions()
 
33
  MODEL_PATH_MATCHA_MEL="matcha_multispeaker_cat_opset_15_10_steps_lastwords.onnx"
34
  MODEL_PATH_MATCHA="matcha_hifigan_multispeaker_cat.onnx"
35
  MODEL_PATH_VOCOS="mel_spec_22khz_v2.onnx"
36
+ CONFIG_PATH="config.yaml"
37
  SPEAKER_ID_DICT="spk_to_id.json"
38
 
39
  sess_options = onnxruntime.SessionOptions()