Respair committed on
Commit
6742cf9
·
verified ·
1 Parent(s): 35e3d3e

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +2 -0
  2. vocos/.github/workflows/pypi-release.yml +26 -0
  3. vocos/.gitignore +164 -0
  4. vocos/LICENSE +21 -0
  5. vocos/README.md +124 -0
  6. vocos/configs/vocos-encodec.yaml +86 -0
  7. vocos/configs/vocos-imdct.yaml +86 -0
  8. vocos/configs/vocos-resnet.yaml +86 -0
  9. vocos/configs/vocos.yaml +90 -0
  10. vocos/configs/vocos24.yaml +90 -0
  11. vocos/data/filelist.train +3 -0
  12. vocos/data/filelist.val +500 -0
  13. vocos/data/filelist2.train +3 -0
  14. vocos/logs/lightning_logs/version_24/config.yaml +152 -0
  15. vocos/logs/lightning_logs/version_24/events.out.tfevents.1738102892.104-171-202-79 +3 -0
  16. vocos/logs/lightning_logs/version_24/hparams.yaml +10 -0
  17. vocos/logs/lightning_logs/version_25/checkpoints/last.ckpt +3 -0
  18. vocos/logs/lightning_logs/version_25/checkpoints/vocos_checkpoint_epoch=0_step=16634_val_loss=6.2461.ckpt +3 -0
  19. vocos/logs/lightning_logs/version_25/checkpoints/vocos_checkpoint_epoch=1_step=33268_val_loss=5.4846.ckpt +3 -0
  20. vocos/logs/lightning_logs/version_25/config.yaml +152 -0
  21. vocos/logs/lightning_logs/version_25/events.out.tfevents.1738103019.104-171-202-79 +3 -0
  22. vocos/logs/lightning_logs/version_25/hparams.yaml +10 -0
  23. vocos/logs/lightning_logs/version_26/checkpoints/last.ckpt +3 -0
  24. vocos/logs/lightning_logs/version_26/checkpoints/vocos_checkpoint_epoch=0_step=16634_val_loss=6.8451.ckpt +3 -0
  25. vocos/logs/lightning_logs/version_26/config.yaml +152 -0
  26. vocos/logs/lightning_logs/version_26/events.out.tfevents.1738103077.104-171-202-79 +3 -0
  27. vocos/logs/lightning_logs/version_26/hparams.yaml +10 -0
  28. vocos/logs/lightning_logs/version_27/checkpoints/last.ckpt +3 -0
  29. vocos/logs/lightning_logs/version_27/checkpoints/vocos_checkpoint_epoch=0_step=16634_val_loss=6.0317.ckpt +3 -0
  30. vocos/logs/lightning_logs/version_27/config.yaml +152 -0
  31. vocos/logs/lightning_logs/version_27/events.out.tfevents.1738146591.104-171-202-79 +3 -0
  32. vocos/logs/lightning_logs/version_27/hparams.yaml +10 -0
  33. vocos/logs/lightning_logs/version_28/config.yaml +152 -0
  34. vocos/logs/lightning_logs/version_28/events.out.tfevents.1738155430.104-171-202-79 +3 -0
  35. vocos/logs/lightning_logs/version_28/hparams.yaml +10 -0
  36. vocos/metrics/UTMOS.py +223 -0
  37. vocos/metrics/__pycache__/UTMOS.cpython-311.pyc +0 -0
  38. vocos/metrics/__pycache__/periodicity.cpython-311.pyc +0 -0
  39. vocos/metrics/epoch=3-step=7459.ckpt +3 -0
  40. vocos/metrics/periodicity.py +105 -0
  41. vocos/metrics/wav2vec_small.pt +3 -0
  42. vocos/notebooks/Bark+Vocos.ipynb +264 -0
  43. vocos/requirements-train.txt +8 -0
  44. vocos/requirements.txt +8 -0
  45. vocos/setup.py +39 -0
  46. vocos/train.py +6 -0
  47. vocos/vocos/__init__.py +4 -0
  48. vocos/vocos/__pycache__/__init__.cpython-311.pyc +0 -0
  49. vocos/vocos/__pycache__/dataset.cpython-311.pyc +0 -0
  50. vocos/vocos/__pycache__/discriminators.cpython-311.pyc +0 -0
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ vocos/data/filelist.train filter=lfs diff=lfs merge=lfs -text
37
+ vocos/data/filelist2.train filter=lfs diff=lfs merge=lfs -text
vocos/.github/workflows/pypi-release.yml ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: Publish Python package
2
+
3
+ on:
4
+ release:
5
+ types: [published]
6
+
7
+ jobs:
8
+ publish:
9
+ runs-on: ubuntu-latest
10
+ steps:
11
+ - uses: actions/checkout@v3
12
+ - name: Set up Python
13
+ uses: actions/setup-python@v4
14
+ with:
15
+ python-version: "3.x"
16
+ - name: Install pypa/setuptools
17
+ run: >-
18
+ python -m
19
+ pip install wheel
20
+ - name: Build a binary wheel
21
+ run: >-
22
+ python setup.py sdist bdist_wheel
23
+ - name: Publish to PyPI
24
+ uses: pypa/gh-action-pypi-publish@release/v1
25
+ with:
26
+ password: ${{ secrets.PYPI_API_TOKEN }}
vocos/.gitignore ADDED
@@ -0,0 +1,164 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Byte-compiled / optimized / DLL files
2
+ __pycache__/
3
+ *.py[cod]
4
+ *$py.class
5
+
6
+ # C extensions
7
+ *.so
8
+
9
+ # Distribution / packaging
10
+ .Python
11
+ build/
12
+ develop-eggs/
13
+ dist/
14
+ downloads/
15
+ eggs/
16
+ .eggs/
17
+ lib/
18
+ lib64/
19
+ parts/
20
+ sdist/
21
+ var/
22
+ wheels/
23
+ share/python-wheels/
24
+ *.egg-info/
25
+ .installed.cfg
26
+ *.egg
27
+ MANIFEST
28
+
29
+ # PyInstaller
30
+ # Usually these files are written by a python script from a template
31
+ # before PyInstaller builds the exe, so as to inject date/other infos into it.
32
+ *.manifest
33
+ *.spec
34
+
35
+ # Installer logs
36
+ pip-log.txt
37
+ pip-delete-this-directory.txt
38
+
39
+ # Unit test / coverage reports
40
+ htmlcov/
41
+ .tox/
42
+ .nox/
43
+ .coverage
44
+ .coverage.*
45
+ .cache
46
+ nosetests.xml
47
+ coverage.xml
48
+ *.cover
49
+ *.py,cover
50
+ .hypothesis/
51
+ .pytest_cache/
52
+ cover/
53
+
54
+ # Translations
55
+ *.mo
56
+ *.pot
57
+
58
+ # Django stuff:
59
+ *.log
60
+ local_settings.py
61
+ db.sqlite3
62
+ db.sqlite3-journal
63
+
64
+ # Flask stuff:
65
+ instance/
66
+ .webassets-cache
67
+
68
+ # Scrapy stuff:
69
+ .scrapy
70
+
71
+ # Sphinx documentation
72
+ docs/_build/
73
+
74
+ # PyBuilder
75
+ .pybuilder/
76
+ target/
77
+
78
+ # Jupyter Notebook
79
+ .ipynb_checkpoints
80
+
81
+ # IPython
82
+ profile_default/
83
+ ipython_config.py
84
+
85
+ # pyenv
86
+ # For a library or package, you might want to ignore these files since the code is
87
+ # intended to run in multiple environments; otherwise, check them in:
88
+ # .python-version
89
+
90
+ # pipenv
91
+ # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
92
+ # However, in case of collaboration, if having platform-specific dependencies or dependencies
93
+ # having no cross-platform support, pipenv may install dependencies that don't work, or not
94
+ # install all needed dependencies.
95
+ #Pipfile.lock
96
+
97
+ # poetry
98
+ # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
99
+ # This is especially recommended for binary packages to ensure reproducibility, and is more
100
+ # commonly ignored for libraries.
101
+ # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
102
+ #poetry.lock
103
+
104
+ # pdm
105
+ # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
106
+ #pdm.lock
107
+ # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
108
+ # in version control.
109
+ # https://pdm.fming.dev/#use-with-ide
110
+ .pdm.toml
111
+
112
+ # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
113
+ __pypackages__/
114
+
115
+ # Celery stuff
116
+ celerybeat-schedule
117
+ celerybeat.pid
118
+
119
+ # SageMath parsed files
120
+ *.sage.py
121
+
122
+ # Environments
123
+ .env
124
+ .venv
125
+ env/
126
+ venv/
127
+ ENV/
128
+ env.bak/
129
+ venv.bak/
130
+
131
+ # Spyder project settings
132
+ .spyderproject
133
+ .spyproject
134
+
135
+ # Rope project settings
136
+ .ropeproject
137
+
138
+ # mkdocs documentation
139
+ /site
140
+
141
+ # mypy
142
+ .mypy_cache/
143
+ .dmypy.json
144
+ dmypy.json
145
+
146
+ # Pyre type checker
147
+ .pyre/
148
+
149
+ # pytype static type analyzer
150
+ .pytype/
151
+
152
+ # Cython debug symbols
153
+ cython_debug/
154
+
155
+ # PyCharm
156
+ # JetBrains specific template is maintained in a separate JetBrains.gitignore that can
157
+ # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
158
+ # and can be added to the global gitignore or merged into this file. For a more nuclear
159
+ # option (not recommended) you can uncomment the following to ignore the entire idea folder.
160
+ .idea/
161
+
162
+ logs/
163
+ *.pt
164
+ *.ckpt
vocos/LICENSE ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ MIT License
2
+
3
+ Copyright (c) 2023 Charactr Inc.
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
vocos/README.md ADDED
@@ -0,0 +1,124 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Vocos: Closing the gap between time-domain and Fourier-based neural vocoders for high-quality audio synthesis
2
+
3
+ [Audio samples](https://gemelo-ai.github.io/vocos/) |
4
+ Paper [[abs]](https://arxiv.org/abs/2306.00814) [[pdf]](https://arxiv.org/pdf/2306.00814.pdf)
5
+
6
+ Vocos is a fast neural vocoder designed to synthesize audio waveforms from acoustic features. Trained using a Generative
7
+ Adversarial Network (GAN) objective, Vocos can generate waveforms in a single forward pass. Unlike other typical
8
+ GAN-based vocoders, Vocos does not model audio samples in the time domain. Instead, it generates spectral
9
+ coefficients, facilitating rapid audio reconstruction through inverse Fourier transform.
10
+
11
+ ## Installation
12
+
13
+ To use Vocos only in inference mode, install it using:
14
+
15
+ ```bash
16
+ pip install vocos
17
+ ```
18
+
19
+ If you wish to train the model, install it with additional dependencies:
20
+
21
+ ```bash
22
+ pip install vocos[train]
23
+ ```
24
+
25
+ ## Usage
26
+
27
+ ### Reconstruct audio from mel-spectrogram
28
+
29
+ ```python
30
+ import torch
31
+
32
+ from vocos import Vocos
33
+
34
+ vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
35
+
36
+ mel = torch.randn(1, 100, 256) # B, C, T
37
+ audio = vocos.decode(mel)
38
+ ```
39
+
40
+ Copy-synthesis from a file:
41
+
42
+ ```python
43
+ import torchaudio
44
+
45
+ y, sr = torchaudio.load(YOUR_AUDIO_FILE)
46
+ if y.size(0) > 1: # mix to mono
47
+ y = y.mean(dim=0, keepdim=True)
48
+ y = torchaudio.functional.resample(y, orig_freq=sr, new_freq=24000)
49
+ y_hat = vocos(y)
50
+ ```
51
+
52
+ ### Reconstruct audio from EnCodec tokens
53
+
54
+ Additionally, you need to provide a `bandwidth_id` which corresponds to the embedding for bandwidth from the
55
+ list: `[1.5, 3.0, 6.0, 12.0]`.
56
+
57
+ ```python
58
+ vocos = Vocos.from_pretrained("charactr/vocos-encodec-24khz")
59
+
60
+ audio_tokens = torch.randint(low=0, high=1024, size=(8, 200)) # 8 codebooks, 200 frames
61
+ features = vocos.codes_to_features(audio_tokens)
62
+ bandwidth_id = torch.tensor([2]) # 6 kbps
63
+
64
+ audio = vocos.decode(features, bandwidth_id=bandwidth_id)
65
+ ```
66
+
67
+ Copy-synthesis from a file: It extracts and quantizes features with EnCodec, then reconstructs them with Vocos in a
68
+ single forward pass.
69
+
70
+ ```python
71
+ y, sr = torchaudio.load(YOUR_AUDIO_FILE)
72
+ if y.size(0) > 1: # mix to mono
73
+ y = y.mean(dim=0, keepdim=True)
74
+ y = torchaudio.functional.resample(y, orig_freq=sr, new_freq=24000)
75
+
76
+ y_hat = vocos(y, bandwidth_id=bandwidth_id)
77
+ ```
78
+
79
+ ### Integrate with 🐶 [Bark](https://github.com/suno-ai/bark) text-to-audio model
80
+
81
+ See [example notebook](notebooks%2FBark%2BVocos.ipynb).
82
+
83
+ ## Pre-trained models
84
+
85
+ | Model Name | Dataset | Training Iterations | Parameters
86
+ |-------------------------------------------------------------------------------------|---------------|-------------------|------------|
87
+ | [charactr/vocos-mel-24khz](https://huggingface.co/charactr/vocos-mel-24khz) | LibriTTS | 1M | 13.5M
88
+ | [charactr/vocos-encodec-24khz](https://huggingface.co/charactr/vocos-encodec-24khz) | DNS Challenge | 2M | 7.9M
89
+
90
+ ## Training
91
+
92
+ Prepare a filelist of audio files for the training and validation set:
93
+
94
+ ```bash
95
+ find $TRAIN_DATASET_DIR -name "*.wav" > filelist.train
96
+ find $VAL_DATASET_DIR -name "*.wav" > filelist.val
97
+ ```
98
+
99
+ Fill a config file, e.g. [vocos.yaml](configs%2Fvocos.yaml), with your filelist paths and start training with:
100
+
101
+ ```bash
102
+ python train.py -c configs/vocos.yaml
103
+ ```
104
+
105
+ Refer to [PyTorch Lightning documentation](https://lightning.ai/docs/pytorch/stable/) for details about customizing the
106
+ training pipeline.
107
+
108
+ ## Citation
109
+
110
+ If this code contributes to your research, please cite our work:
111
+
112
+ ```
113
+ @article{siuzdak2023vocos,
114
+ title={Vocos: Closing the gap between time-domain and Fourier-based neural vocoders for high-quality audio synthesis},
115
+ author={Siuzdak, Hubert},
116
+ journal={arXiv preprint arXiv:2306.00814},
117
+ year={2023}
118
+ }
119
+ ```
120
+
121
+ ## License
122
+
123
+ The code in this repository is released under the MIT license as found in the
124
+ [LICENSE](LICENSE) file.
vocos/configs/vocos-encodec.yaml ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+
4
+ data:
5
+ class_path: vocos.dataset.VocosDataModule
6
+ init_args:
7
+ train_params:
8
+ filelist_path: ???
9
+ sampling_rate: 24000
10
+ num_samples: 24000
11
+ batch_size: 16
12
+ num_workers: 8
13
+
14
+ val_params:
15
+ filelist_path: ???
16
+ sampling_rate: 24000
17
+ num_samples: 24000
18
+ batch_size: 16
19
+ num_workers: 8
20
+
21
+ model:
22
+ class_path: vocos.experiment.VocosEncodecExp
23
+ init_args:
24
+ sample_rate: 24000
25
+ initial_learning_rate: 5e-4
26
+ mel_loss_coeff: 45
27
+ mrd_loss_coeff: 1.0
28
+ num_warmup_steps: 0 # Optimizers warmup steps
29
+ pretrain_mel_steps: 0 # 0 means GAN objective from the first iteration
30
+
31
+ # automatic evaluation
32
+ evaluate_utmos: true
33
+ evaluate_pesq: true
34
+ evaluate_periodicty: true
35
+
36
+ feature_extractor:
37
+ class_path: vocos.feature_extractors.EncodecFeatures
38
+ init_args:
39
+ encodec_model: encodec_24khz
40
+ bandwidths: [1.5, 3.0, 6.0, 12.0]
41
+ train_codebooks: false
42
+
43
+ backbone:
44
+ class_path: vocos.models.VocosBackbone
45
+ init_args:
46
+ input_channels: 128
47
+ dim: 384
48
+ intermediate_dim: 1152
49
+ num_layers: 8
50
+ adanorm_num_embeddings: 4 # len(bandwidths)
51
+
52
+ head:
53
+ class_path: vocos.heads.ISTFTHead
54
+ init_args:
55
+ dim: 384
56
+ n_fft: 1280
57
+ hop_length: 320
58
+ padding: same
59
+
60
+ trainer:
61
+ logger:
62
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
63
+ init_args:
64
+ save_dir: logs/
65
+ callbacks:
66
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
67
+ - class_path: pytorch_lightning.callbacks.ModelSummary
68
+ init_args:
69
+ max_depth: 2
70
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
71
+ init_args:
72
+ monitor: val_loss
73
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
74
+ save_top_k: 3
75
+ save_last: true
76
+ - class_path: vocos.helpers.GradNormCallback
77
+
78
+ # Lightning calculates max_steps across all optimizer steps (rather than number of batches)
79
+ # This equals 1M steps per generator and 1M per discriminator
80
+ max_steps: 2000000
81
+ # You might want to limit val batches when evaluating all the metrics, as they are time-consuming
82
+ limit_val_batches: 100
83
+ accelerator: gpu
84
+ strategy: ddp
85
+ devices: [0]
86
+ log_every_n_steps: 100
vocos/configs/vocos-imdct.yaml ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+
4
+ data:
5
+ class_path: vocos.dataset.VocosDataModule
6
+ init_args:
7
+ train_params:
8
+ filelist_path: ???
9
+ sampling_rate: 24000
10
+ num_samples: 16384
11
+ batch_size: 16
12
+ num_workers: 8
13
+
14
+ val_params:
15
+ filelist_path: ???
16
+ sampling_rate: 24000
17
+ num_samples: 48384
18
+ batch_size: 16
19
+ num_workers: 8
20
+
21
+ model:
22
+ class_path: vocos.experiment.VocosExp
23
+ init_args:
24
+ sample_rate: 24000
25
+ initial_learning_rate: 5e-4
26
+ mel_loss_coeff: 45
27
+ mrd_loss_coeff: 0.1
28
+ num_warmup_steps: 0 # Optimizers warmup steps
29
+ pretrain_mel_steps: 0 # 0 means GAN objective from the first iteration
30
+
31
+ # automatic evaluation
32
+ evaluate_utmos: true
33
+ evaluate_pesq: true
34
+ evaluate_periodicty: true
35
+
36
+ feature_extractor:
37
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
38
+ init_args:
39
+ sample_rate: 24000
40
+ n_fft: 1024
41
+ hop_length: 256
42
+ n_mels: 100
43
+ padding: center
44
+
45
+ backbone:
46
+ class_path: vocos.models.VocosBackbone
47
+ init_args:
48
+ input_channels: 100
49
+ dim: 512
50
+ intermediate_dim: 1536
51
+ num_layers: 8
52
+
53
+ head:
54
+ class_path: vocos.heads.IMDCTCosHead
55
+ init_args:
56
+ dim: 512
57
+ mdct_frame_len: 512 # mel-spec hop_length * 2
58
+ padding: center
59
+
60
+ trainer:
61
+ logger:
62
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
63
+ init_args:
64
+ save_dir: logs/
65
+ callbacks:
66
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
67
+ - class_path: pytorch_lightning.callbacks.ModelSummary
68
+ init_args:
69
+ max_depth: 2
70
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
71
+ init_args:
72
+ monitor: val_loss
73
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
74
+ save_top_k: 3
75
+ save_last: true
76
+ - class_path: vocos.helpers.GradNormCallback
77
+
78
+ # Lightning calculates max_steps across all optimizer steps (rather than number of batches)
79
+ # This equals 1M steps per generator and 1M per discriminator
80
+ max_steps: 2000000
81
+ # You might want to limit val batches when evaluating all the metrics, as they are time-consuming
82
+ limit_val_batches: 100
83
+ accelerator: gpu
84
+ strategy: ddp
85
+ devices: [0]
86
+ log_every_n_steps: 100
vocos/configs/vocos-resnet.yaml ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+
4
+ data:
5
+ class_path: vocos.dataset.VocosDataModule
6
+ init_args:
7
+ train_params:
8
+ filelist_path: ???
9
+ sampling_rate: 24000
10
+ num_samples: 16384
11
+ batch_size: 16
12
+ num_workers: 8
13
+
14
+ val_params:
15
+ filelist_path: ???
16
+ sampling_rate: 24000
17
+ num_samples: 48384
18
+ batch_size: 16
19
+ num_workers: 8
20
+
21
+ model:
22
+ class_path: vocos.experiment.VocosExp
23
+ init_args:
24
+ sample_rate: 24000
25
+ initial_learning_rate: 5e-4
26
+ mel_loss_coeff: 45
27
+ mrd_loss_coeff: 0.1
28
+ num_warmup_steps: 0 # Optimizers warmup steps
29
+ pretrain_mel_steps: 0 # 0 means GAN objective from the first iteration
30
+
31
+ # automatic evaluation
32
+ evaluate_utmos: true
33
+ evaluate_pesq: true
34
+ evaluate_periodicty: true
35
+
36
+ feature_extractor:
37
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
38
+ init_args:
39
+ sample_rate: 24000
40
+ n_fft: 1024
41
+ hop_length: 256
42
+ n_mels: 100
43
+ padding: center
44
+
45
+ backbone:
46
+ class_path: vocos.models.VocosResNetBackbone
47
+ init_args:
48
+ input_channels: 100
49
+ dim: 512
50
+ num_blocks: 3
51
+
52
+ head:
53
+ class_path: vocos.heads.ISTFTHead
54
+ init_args:
55
+ dim: 512
56
+ n_fft: 1024
57
+ hop_length: 256
58
+ padding: center
59
+
60
+ trainer:
61
+ logger:
62
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
63
+ init_args:
64
+ save_dir: logs/
65
+ callbacks:
66
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
67
+ - class_path: pytorch_lightning.callbacks.ModelSummary
68
+ init_args:
69
+ max_depth: 2
70
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
71
+ init_args:
72
+ monitor: val_loss
73
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
74
+ save_top_k: 3
75
+ save_last: true
76
+ - class_path: vocos.helpers.GradNormCallback
77
+
78
+ # Lightning calculates max_steps across all optimizer steps (rather than number of batches)
79
+ # This equals 1M steps per generator and 1M per discriminator
80
+ max_steps: 2000000
81
+ # You might want to limit val batches when evaluating all the metrics, as they are time-consuming
82
+ limit_val_batches: 100
83
+ accelerator: gpu
84
+ strategy: ddp
85
+ devices: [0]
86
+ log_every_n_steps: 100
vocos/configs/vocos.yaml ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+
4
+ data:
5
+ class_path: vocos.dataset.VocosDataModule
6
+ init_args:
7
+ train_params:
8
+ filelist_path: "/home/ubuntu/vocos/data/filelist.train"
9
+ sampling_rate: 44100
10
+ num_samples: 65536
11
+ batch_size: 58
12
+ num_workers: 8
13
+
14
+ val_params:
15
+ filelist_path: "/home/ubuntu/vocos/data/filelist.val"
16
+ sampling_rate: 44100
17
+ num_samples: 65536
18
+ batch_size: 16
19
+ num_workers: 8
20
+
21
+ model:
22
+ class_path: vocos.experiment.VocosExp
23
+ init_args:
24
+ sample_rate: 44100
25
+ initial_learning_rate: 5e-4
26
+ mel_loss_coeff: 45
27
+ mrd_loss_coeff: 0.1
28
+ num_warmup_steps: 0 # Optimizers warmup steps
29
+ pretrain_mel_steps: 0 # 0 means GAN objective from the first iteration
30
+
31
+ # automatic evaluation
32
+ evaluate_utmos: true
33
+ evaluate_pesq: true
34
+ evaluate_periodicty: true
35
+
36
+ feature_extractor:
37
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
38
+ init_args:
39
+ sample_rate: 44100
40
+ n_fft: 2048
41
+ hop_length: 512
42
+ win_length: 2048
43
+ n_mels: 128
44
+ padding: center
45
+
46
+ backbone:
47
+ class_path: vocos.models.VocosBackbone
48
+ init_args:
49
+ input_channels: 128
50
+ dim: 512
51
+ intermediate_dim: 1536
52
+ num_layers: 8
53
+
54
+ head:
55
+ class_path: vocos.heads.ISTFTHead
56
+ init_args:
57
+ dim: 512
58
+ n_fft: 2048
59
+ hop_length: 512
60
+ padding: center
61
+
62
+ trainer:
63
+ logger:
64
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
65
+ init_args:
66
+ save_dir: logs/
67
+ callbacks:
68
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
69
+ - class_path: pytorch_lightning.callbacks.ModelSummary
70
+ init_args:
71
+ max_depth: 2
72
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
73
+ init_args:
74
+ # every_n_train_steps: 5000
75
+ # filename: vocos_checkpoint_step_{step}
76
+ monitor: val_loss
77
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
78
+ save_top_k: 3
79
+ save_last: true
80
+ - class_path: vocos.helpers.GradNormCallback
81
+
82
+ # Lightning calculates max_steps across all optimizer steps (rather than number of batches)
83
+ # This equals 1M steps per generator and 1M per discriminator
84
+ max_steps: 2000000
85
+ # You might want to limit val batches when evaluating all the metrics, as they are time-consuming
86
+ limit_val_batches: 50
87
+ accelerator: gpu
88
+ strategy: ddp
89
+ devices: [0,1]
90
+ log_every_n_steps: 100
vocos/configs/vocos24.yaml ADDED
@@ -0,0 +1,90 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+
4
+ data:
5
+ class_path: vocos.dataset.VocosDataModule
6
+ init_args:
7
+ train_params:
8
+ filelist_path: "/home/ubuntu/vocos/data/filelist2.train"
9
+ sampling_rate: 24000
10
+ num_samples: 57600
11
+ batch_size: 64
12
+ num_workers: 8
13
+
14
+ val_params:
15
+ filelist_path: "/home/ubuntu/vocos/data/filelist.val"
16
+ sampling_rate: 24000
17
+ num_samples: 57600
18
+ batch_size: 16
19
+ num_workers: 8
20
+
21
+ model:
22
+ class_path: vocos.experiment.VocosExp
23
+ init_args:
24
+ sample_rate: 24000
25
+ initial_learning_rate: 5e-4
26
+ mel_loss_coeff: 45
27
+ mrd_loss_coeff: 0.1
28
+ num_warmup_steps: 0 # Optimizers warmup steps
29
+ pretrain_mel_steps: 0 # 0 means GAN objective from the first iteration
30
+
31
+ # automatic evaluation
32
+ evaluate_utmos: true
33
+ evaluate_pesq: true
34
+ evaluate_periodicty: true
35
+
36
+ feature_extractor:
37
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
38
+ init_args:
39
+ sample_rate: 24000
40
+ n_fft: 2048
41
+ hop_length: 300
42
+ win_length: 1200
43
+ n_mels: 80
44
+ padding: center
45
+
46
+ backbone:
47
+ class_path: vocos.models.VocosBackbone
48
+ init_args:
49
+ input_channels: 80
50
+ dim: 512
51
+ intermediate_dim: 1536
52
+ num_layers: 8
53
+
54
+ head:
55
+ class_path: vocos.heads.ISTFTHead
56
+ init_args:
57
+ dim: 512
58
+ n_fft: 2048
59
+ hop_length: 300
60
+ padding: center
61
+
62
+ trainer:
63
+ logger:
64
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
65
+ init_args:
66
+ save_dir: logs/
67
+ callbacks:
68
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
69
+ - class_path: pytorch_lightning.callbacks.ModelSummary
70
+ init_args:
71
+ max_depth: 2
72
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
73
+ init_args:
74
+ # every_n_train_steps: 5000
75
+ # filename: vocos_checkpoint_step_{step}
76
+ monitor: val_loss
77
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
78
+ save_top_k: 3
79
+ save_last: true
80
+ - class_path: vocos.helpers.GradNormCallback
81
+
82
+ # Lightning calculates max_steps across all optimizer steps (rather than number of batches)
83
+ # This equals 1M steps per generator and 1M per discriminator
84
+ max_steps: 2000000
85
+ # You might want to limit val batches when evaluating all the metrics, as they are time-consuming
86
+ limit_val_batches: 50
87
+ accelerator: gpu
88
+ strategy: ddp
89
+ devices: [0,1]
90
+ log_every_n_steps: 100
vocos/data/filelist.train ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:186a28c6524b34bcdfbbe01ed42257db16753ce1e35770385e004fb6ea7219b8
3
+ size 150129204
vocos/data/filelist.val ADDED
@@ -0,0 +1,500 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Gale/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_003/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_003_chunk1424.mp3
2
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/النوم عند قدمي الجبل/النوم عند قدمي الجبل_chunk854.mp3
3
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/حجرتان وصالة/حجرتان وصالة_chunk715.mp3
4
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/СЕМЕЙНЫЙ ЮРИСТ. Развод, алименты и раздел имущества [gp2-6PZBZmU]/СЕМЕ_speaker_SPEAKER_00/СЕМЕ_speaker_SPEAKER_00_chunk513.mp3
5
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أبابيل/أبابيل_chunk979.mp3
6
+ /home/ubuntu/respair/jpn/moe/2cf01874/wav/2cf01874_1845.wav
7
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Is Amazon Good For Small Business? [x6hj-XeDKD4]/Is A_speaker_SPEAKER_05/Is A_speaker_SPEAKER_05_chunk93.wav
8
+ /home/ubuntu/respair/data_cache/Final_Persian/رویا میرعلمی/dfe42e8c-acda-4b52-b0e6-8f02cdc9dbde/dfe42e8c-acda-4b52-b0e6-8f02cdc9dbde_chunk182.mp3
9
+ /home/ubuntu/respair/data_cache/Final_Persian/امیررضا علی زاده/1a762047-afb4-4b6a-a2ae-62b6e80edcbd/1a762047-afb4-4b6a-a2ae-62b6e80edcbd_chunk165.mp3
10
+ /home/ubuntu/respair/jpn/moe/917feebd/wav/917feebd_2750.wav
11
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ЛОГОПЕД. Развитие речи, постановка звуков, массаж и подрезание уздечки [ra3U7s-VZzI]/ЛОГО_speaker_SPEAKER_03/ЛОГО_speaker_SPEAKER_03_chunk183.mp3
12
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/НАСКОЛЬКО ТЫ МУЖИК? Про барбершопы, лысые яйца и давление общества [y2CUqJKfAY8]/НАСК_speaker_SPEAKER_05/НАСК_speaker_SPEAKER_05_chunk414.mp3
13
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/mayu/mayu_cgss/mayu_cgss_card_100270/mayu_cgss_voice_100270_2_03.wav
14
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_13604.wav
15
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Сарко Де Рази - Украденный свет/Сарк_speaker_SPEAKER_00/Сарк_speaker_SPEAKER_00_chunk277.mp3
16
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/نون/نون_chunk636.mp3
17
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Муратов – что происходит с Россией [z1C01Gc9w-w]/Мура_speaker_SPEAKER_01/Мура_speaker_SPEAKER_01_chunk410.mp3
18
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Laezel/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_003/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_003_chunk866.mp3
19
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_expresso/Ylacombe_Expresso_audio_3273_P3.wav
20
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/اليهودي والفتاة العربية/اليهودي والفتاة العربية_chunk1513.mp3
21
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/علامات الحب السبعة/علامات الحب السبعة_chunk560.mp3
22
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Василий Головачев - Спасатели Веера 1 - Посланник_part_002/Васи_speaker_SPEAKER_01/Васи_speaker_SPEAKER_01_chunk455.mp3
23
+ /home/ubuntu/respair/data_cache/Final_Persian/هدا صدر/7bdf73a0-1db6-413c-a363-4e0f55aa4433/7bdf73a0-1db6-413c-a363-4e0f55aa4433_chunk103.mp3
24
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/ranko/ranko_mobamas/ranko_mobamasu_0018/ranko_mobamasu_0018_chunk72.wav
25
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/امرأة في مكان آخر/امرأة في مكان آخر_chunk1577.mp3
26
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/sakurai_takahiro/Sakurai_Takahiro_01/Sakurai_Takahiro_01_chunk1470.wav
27
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/قميص تكويه إمرأتان/قميص تكويه إمرأتان_chunk801.mp3
28
+ /home/ubuntu/respair/data_cache/Final_Persian/امیرمحمد صمصامی/5ad3f710-83cd-4775-9ec4-b72e514bebfc/5ad3f710-83cd-4775-9ec4-b72e514bebfc_chunk162.mp3
29
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/ruski_mix/Становясь волшебницей (1-13 серия) [Dreamcast] [BD 1080] -185087421_456245995 audio only/Стан_speaker_SPEAKER_07/Стан_speaker_SPEAKER_07_chunk946.mp3
30
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/ranko/ranko_cgss/ranko_card_200796/ranko_voice_200796_4_02.wav
31
+ /home/ubuntu/respair/data_cache/Final_Persian/آیلار محمدی/5e44498f-d33b-46ae-b18b-dfd841a4b949/5e44498f-d33b-46ae-b18b-dfd841a4b949_chunk362.mp3
32
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/whispering_chunks/ASMR - ANNUAL EAR CLEANING [Hk9dtOkOPro]/ASMR - ANNUAL EAR CLEANING [Hk9dtOkOPro]_chunk262.mp3
33
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/ru_youtube/ru_youtube_dataset_audio_2010.wav
34
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/طرق سرية للجموح/طرق سرية للجموح_chunk203.mp3
35
+ /home/ubuntu/respair/data_cache/Final_Persian/لیلا ولی پور/6437de3d-b9ae-4c82-a00e-991a14e3731b/6437de3d-b9ae-4c82-a00e-991a14e3731b_chunk82.mp3
36
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Thinking Twice: Revenge of the Tipping Point with Malcolm Gladwell [l2tCLI29S4k]/Thin_speaker_SPEAKER_04/Thin_speaker_SPEAKER_04_chunk410.wav
37
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/تقتلني أو أكتبها/تقتلني أو أكتبها_chunk32.mp3
38
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Kim Kitsuragi Voice Lines (Disco Elyisum) [c5qHI57fkFE]_part_002/Kim Kitsuragi Voice Lines (Disco Elyisum) [c5qHI57fkFE]_part_002_chunk1446.mp3
39
+ /home/ubuntu/respair/data_cache/Final_Persian/امیررضا علی زاده/6dfaaafb-65c5-4dbe-b908-40bc822d74bc/6dfaaafb-65c5-4dbe-b908-40bc822d74bc_chunk401.mp3
40
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/دفتر الغربة/دفتر الغربة_chunk1173.mp3
41
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Валерий Цуркан - Пять веков туда и обратно/Вале_speaker_SPEAKER_02/Вале_speaker_SPEAKER_02_chunk218.mp3
42
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/shiki/shiki_cgss/shiki_card_100101/shiki_voice_100101_2_05.wav
43
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Анна Джейн_08/Анна Джейн_08_chunk276.mp3
44
+ /home/ubuntu/respair/data_cache/Final_Persian/فاطمه ساعدی/f658ca03-a5ef-4ee5-91e9-541c82206bd3/f658ca03-a5ef-4ee5-91e9-541c82206bd3_chunk305.mp3
45
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ЖИЗНЬ С ШИЗОФРЕНИЕЙ-2. Aline in Wonderland. Принудительная госпитализация [iTysDG98Tw8]/ЖИЗН_speaker_SPEAKER_01/ЖИЗН_speaker_SPEAKER_01_chunk530.mp3
46
+ /home/ubuntu/respair/data_cache/Final_Persian/ساعد باقری/99aaa9f7-ad53-449d-94d0-506c4557c240/99aaa9f7-ad53-449d-94d0-506c4557c240_chunk369.mp3
47
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/اللعبة/اللعبة_chunk265.mp3
48
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Тодд_P_44_Samye yarkie zvYozdy/Тодд_P_44_Samye yarkie zvYozdy_chunk16.mp3
49
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/سندريلات مسقط/سندريلات مسقط_chunk229.mp3
50
+ /home/ubuntu/respair/data_cache/Final_Persian/ب‍ی‍ژن ارژن/54c54f7a-36c5-45be-97a3-47f5fb2e74b2/54c54f7a-36c5-45be-97a3-47f5fb2e74b2_chunk9.mp3
51
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Вадим Ечеистов - В тумане/Вади_speaker_SPEAKER_00/Вади_speaker_SPEAKER_00_chunk729.mp3
52
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/ещенепознер – до и во время войны ⧸ before and during the war [mh-7jvePXF4]/ещен_speaker_SPEAKER_09/ещен_speaker_SPEAKER_09_chunk405.mp3
53
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Composure Voice Lines (Disco Elysium) [88ib4sPXm2Q]/Composure Voice Lines (Disco Elysium) [88ib4sPXm2Q]_chunk962.mp3
54
+ /home/ubuntu/respair/data_cache/Final_Persian/بیتا خداداد/633ebac7-ba61-491c-8941-cbc0946f708d/633ebac7-ba61-491c-8941-cbc0946f708d_chunk144.mp3
55
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Inland Empire Voice Lines (Disco Elysium) [qY45lCTGmKc]/Inland Empire Voice Lines (Disco Elysium) [qY45lCTGmKc]_chunk1892.mp3
56
+ /home/ubuntu/respair/data_cache/Final_Persian/مونا فرجاد/b2f3bae3-15fc-43ed-8d2e-2fa8eb65e55e/b2f3bae3-15fc-43ed-8d2e-2fa8eb65e55e_chunk40.mp3
57
+ /home/ubuntu/respair/data_cache/Final_Persian/پویا پورهمدانی/6d7aa3f8-764c-4020-967f-d795940c405c/6d7aa3f8-764c-4020-967f-d795940c405c_chunk595.mp3
58
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/shinichiro_miki/Shinichiro_Miki__02/Shinichiro_Miki__02_chunk1525.wav
59
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Kim Kitsuragi Voice Lines (Disco Elyisum) [c5qHI57fkFE]_part_002/Kim Kitsuragi Voice Lines (Disco Elyisum) [c5qHI57fkFE]_part_002_chunk1519.mp3
60
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/إيفوريا/إيفوريا_chunk1570.mp3
61
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Astrion/BG3 Voice Lines: Astarion (part 2) [yZaGVMN9zGM]/BG3 Voice Lines: Astarion (part 2) [yZaGVMN9zGM]_chunk4878.mp3
62
+ /home/ubuntu/respair/data_cache/Final_Persian/سیاوش رستمی/9334a34f-dc29-4c00-81ec-51ee8f63d45f/9334a34f-dc29-4c00-81ec-51ee8f63d45f_chunk173.mp3
63
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Тодд_P_70_Samye yarkie zvYozdy/Тодд_P_70_Samye yarkie zvYozdy_chunk28.mp3
64
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/طارىء/طارىء_chunk753.mp3
65
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/arisu/arisu_mobamasu/2_arisu__0002_(Vocals)/2_arisu__0002_(Vocals)_chunk31.wav
66
+ /home/ubuntu/respair/jpn/moe/cc948b89/wav/cc948b89_1994.wav
67
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/ظلال الكولوسيوم/ظلال الكولوسيوم_chunk126.mp3
68
+ /home/ubuntu/respair/jpn/moe/b8b5fe66/wav/b8b5fe66_0999.wav
69
+ /home/ubuntu/respair/data_cache/Final_Persian/سحر چوبدار/2d00c6fb-d3d8-4b60-a90f-ffdb45c8e3e5/2d00c6fb-d3d8-4b60-a90f-ffdb45c8e3e5_chunk6.mp3
70
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_podcast/Ylacombe_podcast_audio_1325_P2.wav
71
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/010/S010_F_0022.wav
72
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/لأنها استثناء/لأنها استثناء_chunk873.mp3
73
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/رسائل الأحزان في فلسفة الجمال والحب/رسائل الأحزان في فلسفة الجمال والحب_chunk856.mp3
74
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/22khz/22khz/audiobook_rus_dataset_22khz_audio_5777.wav
75
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Election 2024: Are Identity Politics Holding Us Back? Coleman Hughes vs. Alicia Garza [3G0_0WRV7KM]/Elec_speaker_SPEAKER_00/Elec_speaker_SPEAKER_00_chunk105.wav
76
+ /home/ubuntu/respair/data_cache/Final_Persian/پژمان ابوالقاسمی/dc3e4253-0d7d-43a5-9fc1-ec500f633a21/dc3e4253-0d7d-43a5-9fc1-ec500f633a21_chunk270.mp3
77
+ /home/ubuntu/respair/data_cache/Final_Persian/محیا ساعدی/64717f7d-20a3-4993-8422-c34b24f20815/64717f7d-20a3-4993-8422-c34b24f20815_chunk135.mp3
78
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/ru_youtube/ru_youtube_dataset_audio_1704.wav
79
+ /home/ubuntu/respair/jpn/moe/773a4156/wav/773a4156_2111.wav
80
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/علي السوري/علي السوري_chunk527.mp3
81
+ /home/ubuntu/respair/data_cache/Final_Persian/سارا فیض/46f33750-c90b-4237-863c-2f557965e990/46f33750-c90b-4237-863c-2f557965e990_chunk144.mp3
82
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/قميص تكويه إمرأتان/قميص تكويه إمرأتان_chunk935.mp3
83
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/frame_turner/КУКОЯКА ‒ ОТВЕТ ИНСТАСАМКЕ, ПОЧЕМУ МЫ ТЕРЯЕМ ДРУЗЕЙ И ПЫТАЕМСЯ ЗАСЛУЖИТЬ ЛЮБОВЬ [6xa3X9ztHXQ]/КУКО_speaker_SPEAKER_02/КУКО_speaker_SPEAKER_02_chunk301.mp3
84
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/Karen/karen_cgss/karen_cgss_card_200463/karen_cgss_voice_200463_1_06.wav
85
+ /home/ubuntu/respair/data_cache/Final_Persian/احمد پوری/6fec69f8-4c30-4061-a516-025768b09302/6fec69f8-4c30-4061-a516-025768b09302_chunk443.mp3
86
+ /home/ubuntu/respair/data_cache/Final_Persian/مریم محبوب/b3d13507-b03f-41c8-ace2-62f47fd9077f/b3d13507-b03f-41c8-ace2-62f47fd9077f_chunk395.mp3
87
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/شيروفوبيا/شيروفوبيا_chunk730.mp3
88
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/نون/نون_chunk1170.mp3
89
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Джек Лондон - Конец сказки/Джек_speaker_SPEAKER_00/Джек_speaker_SPEAKER_00_chunk37.mp3
90
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Патрик Несс - Поступь Хаоса_part_002/Патр_speaker_SPEAKER_00/Патр_speaker_SPEAKER_00_chunk50.mp3
91
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/#Debate: Are Men Finished and Should We Help Them? Richard Reeves vs. Hanna Rosin [FlT5clM4WfA]/#Deb_speaker_SPEAKER_02/#Deb_speaker_SPEAKER_02_chunk18.wav
92
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/sawashiro_miyuki/Sawashiro_Miyuki_03/Sawashiro_Miyuki_03_chunk1018.wav
93
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Кейт Лаумер - Король города/Кейт_speaker_SPEAKER_02/Кейт_speaker_SPEAKER_02_chunk1248.mp3
94
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/شهيا كفراق/شهيا كفراق_chunk801.mp3
95
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أبابيل/أبابيل_chunk1144.mp3
96
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Костюченко – история современной России ⧸ вДудь [CobxH2gH4pM]/Кост_speaker_SPEAKER_05/Кост_speaker_SPEAKER_05_chunk2022.mp3
97
+ /home/ubuntu/respair/data_cache/Final_Persian/رضا عمرانی/f9c885e4-adf2-41f5-9d1f-e795f9a11fcc/f9c885e4-adf2-41f5-9d1f-e795f9a11fcc_chunk260.mp3
98
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/#1 АВТОТРЁП. Первые отношения, первый поцелуй, первый секс и личные границы [3wGtRRPTJOc]/#1 А_speaker_SPEAKER_02/#1 А_speaker_SPEAKER_02_chunk162.mp3
99
+ /home/ubuntu/respair/data_cache/Final_Persian/فریناز ثریا/d0cc8097-cbae-428f-a050-270596451802/d0cc8097-cbae-428f-a050-270596451802_chunk198.mp3
100
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Анна Джейн_12/Анна Джейн_12_chunk220.mp3
101
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أسيرة الحب/أسيرة الحب_chunk1310.mp3
102
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/irina/dataset_Yakutenko_Irina_10h_44100_16bit_mono/dataset_Yakutenko_Irina_10h_44100_16bit_mono_chunk5336.wav
103
+ /home/ubuntu/respair/data_cache/Final_Persian/مهرانه امروانی/56697d4e-f417-4872-b1c5-b5186a9989be/56697d4e-f417-4872-b1c5-b5186a9989be_chunk24.mp3
104
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Алексей Калугин - Лабиринт 3 - Мир без солнца_part_000/Алек_speaker_SPEAKER_00/Алек_speaker_SPEAKER_00_chunk13.mp3
105
+ /home/ubuntu/respair/data_cache/Final_Persian/ساعد باقری/fd0ac02c-34f6-4ffc-a9bf-7c1baa2f95f6/fd0ac02c-34f6-4ffc-a9bf-7c1baa2f95f6_chunk721.mp3
106
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/frame_turner/MORGENSHTERN ‒ ЛИЗА, ГАЛЛЮЦИНАЦИИ, ДЕТСКИЕ ТРАВМЫ, ПРИЧИНА РАЗВОДА И СЕКРЕТ УСПЕХА [g1nVX1oPxHE]/MORG_speaker_SPEAKER_11/MORG_speaker_SPEAKER_11_chunk682.mp3
107
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/chiwa_saito/Chiwa_Saito_01/Chiwa_Saito_01_chunk1988_chunks/chunk_1.wav
108
+ /home/ubuntu/respair/data_cache/Final_Persian/لیلا ولی پور/c2887b5a-e92a-46b5-8934-9c537c8d121f/c2887b5a-e92a-46b5-8934-9c537c8d121f_chunk150.mp3
109
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/سمعة شریفة/سمعة شریفة_chunk207.mp3
110
+ /home/ubuntu/respair/jpn/moe/84be23bd/wav/84be23bd_0099.wav
111
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Харлан Эллисон - Бегство к звёздам/Харл_speaker_SPEAKER_00/Харл_speaker_SPEAKER_00_chunk295.mp3
112
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/نزهة مارشال/نزهة مارشال_chunk918.mp3
113
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Debate: Are DEI Mandates for University Faculties a Bad Idea? [eKay5lcv7Ic]/Deba_speaker_SPEAKER_03/Deba_speaker_SPEAKER_03_chunk37.wav
114
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Маша Гессен – стыдные вопросы про Америку ⧸ вДудь [Q0oRii7zV9A]/Маша_speaker_SPEAKER_01/Маша_speaker_SPEAKER_01_chunk1001.mp3
115
+ /home/ubuntu/respair/jpn/moe/9febd2ae/wav/9febd2ae_0483.wav
116
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Брайдер Юрий - Против течения/Брай_speaker_SPEAKER_00/Брай_speaker_SPEAKER_00_chunk414.mp3
117
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/BG3 Voice Lines: Jaheira [r7HxfsGG0zo]/BG3 Voice Lines: Jaheira [r7HxfsGG0zo]_chunk4152.mp3
118
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/BG3 Voice Lines: Minsc [5wO9k1rgRcY]/BG3 Voice Lines: Minsc [5wO9k1rgRcY]_chunk121.mp3
119
+ /home/ubuntu/respair/data_cache/Final_Persian/بهار کاتوزی/eb02fc7d-bdfb-45a0-99ff-62bc5e1c0035/eb02fc7d-bdfb-45a0-99ff-62bc5e1c0035_chunk300.mp3
120
+ /home/ubuntu/respair/jpn/moe/773a4156/wav/773a4156_0261.wav
121
+ /home/ubuntu/respair/jpn/moe/8b6e7173/wav/8b6e7173_0839.wav
122
+ /home/ubuntu/respair/jpn/moe/8b6e7173/wav/8b6e7173_1981.wav
123
+ /home/ubuntu/respair/data_cache/Final_Persian/رضا عمرانی/c77d9712-8a2e-4b82-b096-7dca3886d08c/c77d9712-8a2e-4b82-b096-7dca3886d08c_chunk51.mp3
124
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/003/S003_F_0219.wav
125
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/НУТРИЦИОЛОГ Мария Кардакова. Кето диета, питание на ГВ и дисбактериоз [790CGV-gcRg]/НУТР_speaker_SPEAKER_02/НУТР_speaker_SPEAKER_02_chunk151.mp3
126
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Gale/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_002/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_002_chunk3413.mp3
127
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Is Legalizing Marijuana a Mistake? Live Debate [v_U4CxB0MlA]/Is L_speaker_SPEAKER_12/Is L_speaker_SPEAKER_12_chunk129.wav
128
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/МАРКЕТОЛОГ. Личный бренд, продвижение в соцсетях и инфопродукты [b-nbsSigkKo]/МАРК_speaker_SPEAKER_01/МАРК_speaker_SPEAKER_01_chunk154_chunks/МАРК_speaker_SPEAKER_01_chunk154_chunk_2.mp3
129
+ /home/ubuntu/respair/data_cache/Final_Persian/اعظم حبیبی/8bf4e08c-28b4-4781-8b72-6ce2d8cdb714/8bf4e08c-28b4-4781-8b72-6ce2d8cdb714_chunk30.mp3
130
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/سمعة شریفة/سمعة شریفة_chunk330.mp3
131
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Conceptualization Voice Lines (Disco Elysium) [4cFbMy0snYQ]/Conceptualization Voice Lines (Disco Elysium) [4cFbMy0snYQ]_chunk1161.mp3
132
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/مدينة الحب لا يسكنها العقلاء/مدينة الحب لا يسكنها العقلاء_chunk1150.mp3
133
+ /home/ubuntu/respair/data_cache/Final_Persian/بهرام ابراهیمی/97fff66d-e81e-4e91-8782-9db5118ecbc7/97fff66d-e81e-4e91-8782-9db5118ecbc7_chunk24.mp3
134
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_podcast/Ylacombe_podcast_audio_1636.wav
135
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_expresso/Ylacombe_Expresso_audio_11326_P3.wav
136
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Сьюзен Коллинз 1 - Голодные игры_part_001/Сьюз_speaker_SPEAKER_00/Сьюз_speaker_SPEAKER_00_chunk583.mp3
137
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Клиффорд Саймак - Кукла судьбы_part_003/Клиф_speaker_SPEAKER_05/Клиф_speaker_SPEAKER_05_chunk1632.mp3
138
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Does the Effective Altruism Movement Get Giving Right? [e1e_TUbRdlA]/Does_speaker_SPEAKER_02/Does_speaker_SPEAKER_02_chunk364.wav
139
+ /home/ubuntu/respair/jpn/soshy/Japanese/sakura_moyu/01/01011190.wav
140
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/في ديسمبر تنتهي كل الأحلام/في ديسمبر تنتهي كل الأحلام_chunk1404.mp3
141
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/علامات الحب السبعة/علامات الحب السبعة_chunk1041.mp3
142
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_6750.wav
143
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Гордон - Украина, Россия, Ukraine, Russia (English subs) [in7tepc2shg]/Горд_speaker_SPEAKER_03/Горд_speaker_SPEAKER_03_chunk170.mp3
144
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Astrion/BG3 Voice Lines: Astarion (part 1) [THs2r-xB-Rw]_part_000/BG3 Voice Lines: Astarion (part 1) [THs2r-xB-Rw]_part_000_chunk277.mp3
145
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أرغبه رجلا يا أبي/أرغبه رجلا يا أبي_chunk302.mp3
146
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/nagi/nagi_cgss/nagi_chara_309/nagi_voice_309_4_13.wav
147
+ /home/ubuntu/respair/data_cache/Final_Persian/شهرزاد عالی/4c413c0b-ed80-4d4a-95c4-21147a612d8a/4c413c0b-ed80-4d4a-95c4-21147a612d8a_chunk56.mp3
148
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Этногенез - Маруся 3_part_001/Этно_speaker_SPEAKER_05/Этно_speaker_SPEAKER_05_chunk295.mp3
149
+ /home/ubuntu/respair/data_cache/Final_Persian/ساعد باقری/b842c75e-7251-441c-852d-fc8cc5c20558/b842c75e-7251-441c-852d-fc8cc5c20558_chunk282.mp3
150
+ /home/ubuntu/respair/jpn/moe/b8b5fe66/wav/b8b5fe66_1892.wav
151
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_expresso/Ylacombe_Expresso_audio_8528_P3.wav
152
+ /home/ubuntu/respair/data_cache/Final_Persian/اطهر کلانتری/e9d04f1c-5687-422e-8ab7-4db6e95fd8b4/e9d04f1c-5687-422e-8ab7-4db6e95fd8b4_chunk176.mp3
153
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/013/S013_A_0244.wav
154
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/دفتر الغربة/دفتر الغربة_chunk920.mp3
155
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Сергей Супонев - друг всех детей ⧸ вДудь [ckyW08MpmHs]/Серг_speaker_SPEAKER_07/Серг_speaker_SPEAKER_07_chunk84.mp3
156
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Karlach/BG3 Voice Lines: Karlach [Enn8zDfS6Es]_part_002/BG3 Voice Lines: Karlach [Enn8zDfS6Es]_part_002_chunk2517.mp3
157
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_1754.wav
158
+ /home/ubuntu/respair/data_cache/Final_Persian/نازنین آذرسا/3b014b6b-29ee-4ae1-846e-f889cdd2206b/3b014b6b-29ee-4ae1-846e-f889cdd2206b_chunk120.mp3
159
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Владимир Яценко - Старик и дети/Влад_speaker_SPEAKER_00/Влад_speaker_SPEAKER_00_chunk278.mp3
160
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/لأنها استثناء/لأنها استثناء_chunk347.mp3
161
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/frederica/fredrica_cgss/fredrica_card_100747/fredrica_voice_100747_1_11.wav
162
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/يا سلمى أنا الآن وحيد /يا سلمى أنا الآن وحيد _chunk798.mp3
163
+ /home/ubuntu/respair/jpn/moe/6d565f54/wav/6d565f54_1248.wav
164
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/BG3 Voice Lines: Minsc [5wO9k1rgRcY]/BG3 Voice Lines: Minsc [5wO9k1rgRcY]_chunk3356.mp3
165
+ /home/ubuntu/respair/data_cache/Final_Persian/اشکان عقیلی پور/ef422f57-99b8-40cd-8e22-553025f09d3d/ef422f57-99b8-40cd-8e22-553025f09d3d_chunk131.mp3
166
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Джек Андерсон - Игра в лево-право/Джек_speaker_SPEAKER_04/Джек_speaker_SPEAKER_04_chunk4173.mp3
167
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/الميلاد/الميلاد_chunk595.mp3
168
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/Taiga/Taiga_rus_dataset_audio_5866.wav
169
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Сьюзен Коллинз 1 - Голодные игры_part_001/Сьюз_speaker_SPEAKER_00/Сьюз_speaker_SPEAKER_00_chunk1319.mp3
170
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/sawashiro_miyuki/Sawashiro_Miyuki_03/Sawashiro_Miyuki_03_chunk752.wav
171
+ /home/ubuntu/respair/data_cache/Final_Persian/بهراد رضازاده/5e04ac82-5ecf-4af5-976f-7fa319e5926d/5e04ac82-5ecf-4af5-976f-7fa319e5926d_chunk187.mp3
172
+ /home/ubuntu/respair/data_cache/Final_Persian/امیررضا علی زاده/d17ab7bd-ebb2-4442-9730-e84726cb90a4/d17ab7bd-ebb2-4442-9730-e84726cb90a4_chunk88.mp3
173
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/ذئاب لا تغفر/ذئاب لا تغفر_chunk1130.mp3
174
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Karlach/BG3 Voice Lines: Karlach [Enn8zDfS6Es]_part_001/BG3 Voice Lines: Karlach [Enn8zDfS6Es]_part_001_chunk2549.mp3
175
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/عشقني عفريت من الجن/عشقني عفريت من الجن_chunk303.mp3
176
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Authority Voice Lines (Disco Elysium) [lsWdvLZ9Wac]/Authority Voice Lines (Disco Elysium) [lsWdvLZ9Wac]_chunk363.mp3
177
+ /home/ubuntu/respair/data_cache/Final_Persian/مرضیه رحماندوست/3f460bef-ebe3-4407-89ec-61d7956b8d4c/3f460bef-ebe3-4407-89ec-61d7956b8d4c_chunk204.mp3
178
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/فوضى الحواس/فوضى الحواس_chunk1030.mp3
179
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/كلب عائلة باسكرفيل/كلب عائلة باسكرفيل_chunk1217.mp3
180
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/АЛЕКСАНДР ПАНЧИН. Агностики, соционика и вакцины от коронавируса [PeS8Bh9vizI]/АЛЕК_speaker_SPEAKER_00/АЛЕК_speaker_SPEAKER_00_chunk452.mp3
181
+ /home/ubuntu/respair/data_cache/Final_Persian/ساعد باقری/a37f3bf0-3061-4cd7-a2df-446e507439dc/a37f3bf0-3061-4cd7-a2df-446e507439dc_chunk460.mp3
182
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/BG3 Voice Lines: Jaheira [r7HxfsGG0zo]/BG3 Voice Lines: Jaheira [r7HxfsGG0zo]_chunk6181.mp3
183
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/sawashiro_miyuki/Sawashiro_Miyuki_02/Sawashiro_Miyuki_02_chunk489.wav
184
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/السكابندو وقصص أخرى/السكابندو وقصص أخرى_chunk225.mp3
185
+ /home/ubuntu/respair/data_cache/Final_Persian/حامد فعال/863f0f5f-7f71-4d7a-b286-0587b223d7bf/863f0f5f-7f71-4d7a-b286-0587b223d7bf_chunk214.mp3
186
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/شوق الدرويش/شوق الدرويش_chunk1194.mp3
187
+ /home/ubuntu/respair/jpn/moe/ee093a4f/wav/ee093a4f_1537.wav
188
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ЛОГОПЕД. Развитие речи, постановка звуков, массаж и подрезание уздечки [ra3U7s-VZzI]/ЛОГО_speaker_SPEAKER_00/ЛОГО_speaker_SPEAKER_00_chunk921.mp3
189
+ /home/ubuntu/respair/data_cache/Final_Persian/کاوه فولادی نسب/4152c4fa-1b13-4854-8e48-fb7914bdea8f/4152c4fa-1b13-4854-8e48-fb7914bdea8f_chunk100.mp3
190
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/سيدة في خدمتك/سيدة في خدمتك_chunk850.mp3
191
+ /home/ubuntu/respair/data_cache/Final_Persian/فاطمه کمالی/180ad9ff-c82a-45ff-9b34-8d62c4d142fb/180ad9ff-c82a-45ff-9b34-8d62c4d142fb_chunk343.mp3
192
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_podcast/Ylacombe_podcast_audio_1060_P3.wav
193
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/Syuuko/Syuuko_Events_and_Card/Card_Commyuu/Work_Comyu/Work_Comyu_chunk55.wav
194
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Джейн_Анна_15/Джейн_Анна_15_chunk107.mp3
195
+ /home/ubuntu/respair/data_cache/Final_Persian/حسین تسلیمی/f723254c-afd5-45b9-bb2d-f6e24f1d0a69/f723254c-afd5-45b9-bb2d-f6e24f1d0a69_chunk416.mp3
196
+ /home/ubuntu/respair/data_cache/Final_Persian/لاله اکبری/ff57cb36-b8db-4039-bd12-7c37e6011f80/ff57cb36-b8db-4039-bd12-7c37e6011f80_chunk74.mp3
197
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Morell, the Cryptozoologist Voice Lines (Disco Elysium) [O-ESHKnBNGo]/Morell, the Cryptozoologist Voice Lines (Disco Elysium) [O-ESHKnBNGo]_chunk355.mp3
198
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/بئر الحرمان/بئر الحرمان_chunk1537.mp3
199
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/frame_turner/MORGENSHTERN ‒ ЛИЗА, ГАЛЛЮЦИНАЦИИ, ДЕТСКИЕ ТРАВМЫ, ПРИЧИНА РАЗВОДА И СЕКРЕТ УСПЕХА [g1nVX1oPxHE]/MORG_speaker_SPEAKER_02/MORG_speaker_SPEAKER_02_chunk1023.mp3
200
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/إحدى عشرة دقيقة/إحدى عشرة دقيقة_chunk451.mp3
201
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/قدري أنت/قدري أنت_chunk36.mp3
202
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Джейн_Анна_04/Джейн_Анна_04_chunk118.mp3
203
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/shinichiro_miki/Shinichiro_Miki__01/Shinichiro_Miki__01_chunk270.wav
204
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Лошак – как оставаться журналистом ⧸ Loshak – how to stay a journalist [PWt27h_scaY]/Лоша_speaker_SPEAKER_04/Лоша_speaker_SPEAKER_04_chunk299.mp3
205
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Debate: Is Wokeness Killing Comedy? Live - Lou Perez vs. Michael Ian Black [J4Vb53s4I0A]/Deba_speaker_SPEAKER_06/Deba_speaker_SPEAKER_06_chunk23.wav
206
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أنشودة المقهى الحزين/أ��شودة المقهى الحزين_chunk204.mp3
207
+ /home/ubuntu/respair/data_cache/Final_Persian/تارا تیمورزاده/ac11ca31-2fc5-498c-8c94-5bcd49a76fdb/ac11ca31-2fc5-498c-8c94-5bcd49a76fdb_chunk410.mp3
208
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Анна Джейн_21/Анна Джейн_21_chunk358.mp3
209
+ /home/ubuntu/respair/jpn/moe/ad28b91b/wav/ad28b91b_2228.wav
210
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/سوف أحكي عنك /سوف أحكي عنك _chunk297.mp3
211
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/whispering_chunks/ASMR - JANUARY 2023 - Monthly Favourites [9rv-PFYRAho]/ASMR - JANUARY 2023 - Monthly Favourites [9rv-PFYRAho]_chunk280.mp3
212
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Evrart Claire Voice Lines (Disco Elysium) [3fyCrwXUM3c]/Evrart Claire Voice Lines (Disco Elysium) [3fyCrwXUM3c]_chunk1318.mp3
213
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Karlach/BG3 Voice Lines: Karlach [Enn8zDfS6Es]_part_001/BG3 Voice Lines: Karlach [Enn8zDfS6Es]_part_001_chunk2221.mp3
214
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/004/S004_E_0006.wav
215
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Kim Kitsuragi Voice Lines (Disco Elyisum) [c5qHI57fkFE]_part_001/Kim Kitsuragi Voice Lines (Disco Elyisum) [c5qHI57fkFE]_part_001_chunk16.mp3
216
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Should Courts, Not Campuses, Decide Sexual Assault Cases? [XdH7X9i5NpM]/Shou_speaker_SPEAKER_05/Shou_speaker_SPEAKER_05_chunk63_chunks/Shou_speaker_SPEAKER_05_chunk63_chunk_1.mp3
217
+ /home/ubuntu/respair/data_cache/Final_Persian/آرش راسخ/af8053f2-6a13-4c77-a2a4-c6b01997d6f6/af8053f2-6a13-4c77-a2a4-c6b01997d6f6_chunk509.mp3
218
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Алексей Калугин - Подмененный 3 - Осколки реальности_part_000/Алек_speaker_SPEAKER_03/Алек_speaker_SPEAKER_03_chunk18.mp3
219
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/shadow_heart/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_000/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_000_chunk2321.mp3
220
+ /home/ubuntu/respair/data_cache/Final_Persian/نازنین آذرسا/50c24690-436c-475c-93ec-ded918f2f09e/50c24690-436c-475c-93ec-ded918f2f09e_chunk252.mp3
221
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ГЕШТАЛЬТ ТЕРАПИЯ и осознанность в эмоциях. Как незакрытый гештальт переходит в невроз [_EXkjzgfCi8]/ГЕШТ_speaker_SPEAKER_02/ГЕШТ_speaker_SPEAKER_02_chunk42.mp3
222
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أوراق الورد/أوراق الورد_chunk440.mp3
223
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/СЕМЕЙНЫЙ ПСИХОЛОГ. Развод, абьюз и феминизм. Сохранять ли брак ради ребёнка? [AeKXCnoEKSA]/СЕМЕ_speaker_SPEAKER_04/СЕМЕ_speaker_SPEAKER_04_chunk760.mp3
224
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/frame_turner/ЯНЧИК ‒ ГОЛОСА В ГОЛОВЕ, СТРАХ ОШИБОК, ОКР И ВЫЖИВАНИЕ В ЛЕСУ [czFc_d2tp8I]/ЯНЧИ_speaker_SPEAKER_06/ЯНЧИ_speaker_SPEAKER_06_chunk993.mp3
225
+ /home/ubuntu/respair/jpn/moe/1a5a3db8/wav/1a5a3db8_0215.wav
226
+ /home/ubuntu/respair/jpn/moe/6d565f54/wav/6d565f54_1467.wav
227
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/shiburin/shiburin_cgss/shiburin_card_200071/shiburin_voice_200071_2_11.wav
228
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Сьюзен Коллинз 1 - Голодные игры_part_002/Сьюз_speaker_SPEAKER_00/Сьюз_speaker_SPEAKER_00_chunk717.mp3
229
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/إيفوريا/إيفوريا_chunk1102.mp3
230
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Laezel/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_002/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_002_chunk37.mp3
231
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Global Leaders Debate Money, Truth, and Power [ygW1PsuaipY]/Glob_speaker_SPEAKER_07/Glob_speaker_SPEAKER_07_chunk34.wav
232
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/حسناء في المستنقع/حسناء في المستنقع_chunk709.mp3
233
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/صياد النسيم/صياد النسيم_chunk1384.mp3
234
+ /home/ubuntu/respair/jpn/moe/5d68aedf/wav/5d68aedf_1891.wav
235
+ /home/ubuntu/respair/data_cache/Final_Persian/اشکان عقیلی پور/642bad82-6b0b-474d-b989-b0508cb76adf/642bad82-6b0b-474d-b989-b0508cb76adf_chunk83.mp3
236
+ /home/ubuntu/respair/jpn/moe/5d68aedf/wav/5d68aedf_1025.wav
237
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/شوق الدرويش/شوق الدرويش_chunk504.mp3
238
+ /home/ubuntu/respair/jpn/moe/df6c208e/wav/df6c208e_1504.wav
239
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/العذراء والشعر الأبيض/العذراء والشعر الأبيض_chunk186.mp3
240
+ /home/ubuntu/respair/data_cache/Final_Persian/گلاره عباسی/bb4764d9-a6bb-44e5-b80d-05033943ea22/bb4764d9-a6bb-44e5-b80d-05033943ea22_chunk25.mp3
241
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Astrion/BG3 Voice Lines: Astarion (part 1) [THs2r-xB-Rw]_part_001/BG3 Voice Lines: Astarion (part 1) [THs2r-xB-Rw]_part_001_chunk15.mp3
242
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/أيام فاتت/أيام فاتت_chunk669.mp3
243
+ /home/ubuntu/respair/data_cache/Final_Persian/گلچهر دامغانی/ed978bcb-b73c-43b9-8feb-eedb63c9a006/ed978bcb-b73c-43b9-8feb-eedb63c9a006_chunk951.mp3
244
+ /home/ubuntu/respair/data_cache/Final_Persian/مرضیه رحماندوست/a0e913cd-32e4-4410-a613-196de8204050/a0e913cd-32e4-4410-a613-196de8204050_chunk12.mp3
245
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/001/S001_F_0129.wav
246
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/shadow_heart/BG3 Voice Lines: Shadowheart (part 2) [PoureCLZNxg]/BG3 Voice Lines: Shadowheart (part 2) [PoureCLZNxg]_chunk2395.mp3
247
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ЖИЗНЬ С ШИЗОФРЕНИЕЙ-2. Aline in Wonderland. Принудительная госпитализация [iTysDG98Tw8]/ЖИЗН_speaker_SPEAKER_01/ЖИЗН_speaker_SPEAKER_01_chunk699.mp3
248
+ /home/ubuntu/respair/data_cache/Final_Persian/شقایق خاکی پور/d8ade414-0f5a-4333-a9f5-89895d617e4a/d8ade414-0f5a-4333-a9f5-89895d617e4a_chunk631.mp3
249
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ДОКТОР УТИН. Кофе и сердце, что такое инфаркт, как правильно измерять давление [uXgDhDdDW2g]/ДОКТ_speaker_SPEAKER_04/ДОКТ_speaker_SPEAKER_04_chunk129.mp3
250
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ПОДРОСТОК о СЕКСЕ. Надо ли родителям разговаривать с детьми? Проблемы в школах [Wo3ZqS01R2w]/ПОДР_speaker_SPEAKER_04/ПОДР_speaker_SPEAKER_04_chunk121.mp3
251
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/سايكو 2/سايكو 2_chunk494.mp3
252
+ /home/ubuntu/respair/jpn/moe/9febd2ae/wav/9febd2ae_0753.wav
253
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/horie_yui/Horie_Yui_02/Horie_Yui_02_chunk184.wav
254
+ /home/ubuntu/respair/jpn/moe/449d5a0a/wav/449d5a0a_0949.wav
255
+ /home/ubuntu/respair/jpn/moe/95c3bdd8/wav/95c3bdd8_0871.wav
256
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/لكنك لن تعرفي/لكنك لن تعرفي_chunk650.mp3
257
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Степанова_41/Степанова_41_chunk1.mp3
258
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/شیكولاتة بیضاء/شیكولاتة بیضاء_chunk402.mp3
259
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/Kanade/Kanade_voice_home_shinaido_room/kanade_card_200580/kanade_voice_200580_6_05.wav
260
+ /home/ubuntu/respair/data_cache/Final_Persian/نازنین آذرسا/b3aa3650-ab3d-4fef-8c43-76abac9ee044/b3aa3650-ab3d-4fef-8c43-76abac9ee044_chunk148.mp3
261
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ДОКТОР УТИН. Кофе и сердце, что такое инфаркт, как правильно измерять давление [uXgDhDdDW2g]/ДОКТ_speaker_SPEAKER_02/ДОКТ_speaker_SPEAKER_02_chunk451.mp3
262
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Степанова_40/Степанова_40_chunk43.mp3
263
+ /home/ubuntu/respair/data_cache/Final_Persian/مصطفی هرآیینی/e4cc5f9b-523f-49d4-88a3-e432c19fdadb/e4cc5f9b-523f-49d4-88a3-e432c19fdadb_chunk105.mp3
264
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Should Courts, Not Campuses, Decide Sexual Assault Cases? [XdH7X9i5NpM]/Shou_speaker_SPEAKER_05/Shou_speaker_SPEAKER_05_chunk58.wav
265
+ /home/ubuntu/respair/jpn/soshy/Japanese/sakura_moyu/05/05000390.wav
266
+ /home/ubuntu/respair/jpn/moe/1cc3c6c0/wav/1cc3c6c0_0223.wav
267
+ /home/ubuntu/respair/jpn/moe/cbe5080e/wav/cbe5080e_0793.wav
268
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/سيدة في خدمتك/سيدة في خدمتك_chunk999.mp3
269
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Agree-to-Disagree: Is True Love a Myth? [78PXedWyBAA]/Agre_speaker_SPEAKER_02/Agre_speaker_SPEAKER_02_chunk27.wav
270
+ /home/ubuntu/respair/jpn/moe/bc778ddb/wav/bc778ddb_0956.wav
271
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/ما تخبئه لنا النجوم/ما تخبئه لنا النجوم_chunk570.mp3
272
+ /home/ubuntu/respair/data_cache/Final_Persian/شهین دخت نجف زاده/d65e3143-dd32-4720-816f-7cbd92fd8bac/d65e3143-dd32-4720-816f-7cbd92fd8bac_chunk98.mp3
273
+ /home/ubuntu/respair/data_cache/Final_Persian/راضیه هاشمی/4d542086-331f-4f79-902f-9e27e5e5217d/4d542086-331f-4f79-902f-9e27e5e5217d_chunk439.mp3
274
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/شیكولاتة بیضاء/شیكولاتة بیضاء_chunk471.mp3
275
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Composure Voice Lines (Disco Elysium) [88ib4sPXm2Q]/Composure Voice Lines (Disco Elysium) [88ib4sPXm2Q]_chunk346.mp3
276
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/22khz/22khz/audiobook_rus_dataset_22khz_audio_12940.wav
277
+ /home/ubuntu/respair/data_cache/Final_Persian/نرگس رحیمیان/acf1cb92-a813-4580-bf54-1544bd24410d/acf1cb92-a813-4580-bf54-1544bd24410d_chunk878.mp3
278
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/minami/minami_cgss/minami_card_201307/minami_voice_201307_2_02.wav
279
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/بيت ح دد/بيت ح دد_chunk821.mp3
280
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/shinichiro_miki/Shinichiro_Miki_03/Shinichiro_Miki_03_chunk2211.wav
281
+ /home/ubuntu/respair/data_cache/Final_Persian/مهبد قناعت پیشه/8542aeb6-372a-4dfe-970c-c8376bf2a8b6/8542aeb6-372a-4dfe-970c-c8376bf2a8b6_chunk43.mp3
282
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/ردني إليك/ردني إليك_chunk365.mp3
283
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Shivers Voice Lines (Disco Elysium) [PgHIM3M1Al4]/Shivers Voice Lines (Disco Elysium) [PgHIM3M1Al4]_chunk1312.mp3
284
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/تقتلني أو أكتبها/تقتلني أو أكتبها_chunk1142.mp3
285
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/004/S004_C_0070.wav
286
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/shadow_heart/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_001/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_001_chunk894.mp3
287
+ /home/ubuntu/respair/data_cache/Final_Persian/صفا آقاجانی/59968192-7770-4c9f-83ac-83ab686d5649/59968192-7770-4c9f-83ac-83ab686d5649_chunk111.mp3
288
+ /home/ubuntu/respair/data_cache/Final_Persian/مارال نوحی/98447c9c-684c-4043-8f67-95c2d8977053/98447c9c-684c-4043-8f67-95c2d8977053_chunk176.mp3
289
+ /home/ubuntu/respair/data_cache/Final_Persian/پژمان ابوالقاسمی/08226e7f-f4dc-4ba7-a71a-fd526e8572e2/08226e7f-f4dc-4ba7-a71a-fd526e8572e2_chunk717.mp3
290
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Debate: Is the FDA Too Cautious? [FSkyfsTL_xw]/Deba_speaker_SPEAKER_03/Deba_speaker_SPEAKER_03_chunk90.wav
291
+ /home/ubuntu/respair/data_cache/Final_Persian/یاسر دعاگو/c2baaef2-faaa-4110-903e-1c5e422a13b1/c2baaef2-faaa-4110-903e-1c5e422a13b1_chunk658.mp3
292
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/باريس بلا ايفل/باريس بلا ايفل_chunk592.mp3
293
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Сергей Павин - Лавка песочных часов/Серг_speaker_SPEAKER_00/Серг_speaker_SPEAKER_00_chunk139.mp3
294
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/Taiga/Taiga_rus_dataset_audio_7198.wav
295
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/بلاد الطاخ طاخ/بلاد الطاخ طاخ_chunk1234.mp3
296
+ /home/ubuntu/respair/data_cache/Final_Persian/شقایق خاکی پور/d528184f-99d0-4136-99a1-3eab3c4a4166/d528184f-99d0-4136-99a1-3eab3c4a4166_chunk161.mp3
297
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Степанова_16/Степанова_16_chunk39.mp3
298
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/لن أنسى/لن أنسى_chunk540.mp3
299
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/frame_turner/ЯНЧИК ‒ ГОЛОСА В ГОЛОВЕ, СТРАХ ОШИБОК, ОКР И ВЫЖИВАНИЕ В ЛЕСУ [czFc_d2tp8I]/ЯНЧИ_speaker_SPEAKER_07/ЯНЧИ_speaker_SPEAKER_07_chunk94.mp3
300
+ /home/ubuntu/respair/jpn/soshy/Japanese/sakura_moyu/01/01014470.wav
301
+ /home/ubuntu/respair/data_cache/Final_Persian/بابک مینایی/a519dfd7-140c-4537-bd63-8b71bb70845b/a519dfd7-140c-4537-bd63-8b71bb70845b_chunk114.mp3
302
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/رقصة المرمر/رقصة المرمر_chunk1366.mp3
303
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/سأقذف نفسي أمامك/سأقذف نفسي أمامك_chunk722.mp3
304
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/Taiga/Taiga_rus_dataset_audio_3655.wav
305
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/خبايا العرب/خبايا العرب_chunk1176.mp3
306
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Клиффорд Саймак - Кукла судьбы_part_003/Клиф_speaker_SPEAKER_05/Клиф_speaker_SPEAKER_05_chunk1177.mp3
307
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/سألقاك هناك/سألقاك هناك_chunk1101.mp3
308
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Glava_03/Glava_03_chunk562.mp3
309
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_6555.wav
310
+ /home/ubuntu/respair/data_cache/Final_Persian/تارا تیمورزاده/ad22083b-b26c-4b6e-9908-3faefdbc298f/ad22083b-b26c-4b6e-9908-3faefdbc298f_chunk364.mp3
311
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/ranko/ranko_cgss/ranko_card_200097/ranko_voice_200097_1_09.wav
312
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/ولد قليل الأدب/ولد قليل الأدب_chunk1820.mp3
313
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Laezel/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_003/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_003_chunk344.mp3
314
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/shadow_heart/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_001/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_001_chunk631.mp3
315
+ /home/ubuntu/respair/data_cache/Final_Persian/محمد امرایی/0f6832d4-b027-4fba-bcd6-5ef85242bd99/0f6832d4-b027-4fba-bcd6-5ef85242bd99_chunk230.mp3
316
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أنا سنية و أنت شيعي/أنا سنية و أنت شيعي_chunk641.mp3
317
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ПЕРИНАТАЛЬНЫЙ ПСИХОЛОГ. Про тикающие часики, ЭКО и аборты. Как пережить потерю ребенка [qhxe6nZ4p4E]/ПЕРИ_speaker_SPEAKER_02/ПЕРИ_speaker_SPEAKER_02_chunk844.mp3
318
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/22khz/22khz/audiobook_rus_dataset_22khz_audio_7589.wav
319
+ /home/ubuntu/respair/data_cache/Final_Persian/مهدی صفری/48094592-83d7-4ced-a375-29a7f1a348fe/48094592-83d7-4ced-a375-29a7f1a348fe_chunk260.mp3
320
+ /home/ubuntu/respair/data_cache/Final_Persian/الیاس گرجی/9e40cee4-7270-44f9-8264-052106027a01/9e40cee4-7270-44f9-8264-052106027a01_chunk81.mp3
321
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Лошак – как оставаться журналистом ⧸ Loshak – how to stay a journalist [PWt27h_scaY]/Лоша_speaker_SPEAKER_03/Лоша_speaker_SPEAKER_03_chunk238.mp3
322
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Jean Vicquemare Voice Lines (Disco Elysium) [z_7OvqdkmKI]/Jean Vicquemare Voice Lines (Disco Elysium) [z_7OvqdkmKI]_chunk54.mp3
323
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/اللعبة/اللعبة_chunk520.mp3
324
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/السكابندو وقصص أخرى/السكابندو وقصص أخرى_chunk1226.mp3
325
+ /home/ubuntu/respair/jpn/moe/46d6bf83/wav/46d6bf83_1389.wav
326
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/قصص الكتب الخمسة/قصص الكتب الخمسة_chunk253.mp3
327
+ /home/ubuntu/respair/data_cache/Final_Persian/یاسر دعاگو/33a8dea0-1d4c-4e08-9097-3f3906a7b488/33a8dea0-1d4c-4e08-9097-3f3906a7b488_chunk370.mp3
328
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/sawashiro_miyuki/Sawashiro_Miyuki_02/Sawashiro_Miyuki_02_chunk1671.wav
329
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Karlach/BG3 Voice Lines: Karlach [Enn8zDfS6Es]_part_001/BG3 Voice Lines: Karlach [Enn8zDfS6Es]_part_001_chunk211.mp3
330
+ /home/ubuntu/respair/data_cache/Final_Persian/فاطمه کمالی/9046daac-a4ae-4879-b7a0-1f99a8ea757f/9046daac-a4ae-4879-b7a0-1f99a8ea757f_chunk11.mp3
331
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/إفطار عند تيفاني/إفطار عند تيفاني_chunk1416.mp3
332
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Neha, the Novelty Dicemaker Voice Lines (Disco Elysium) [bSZCBFjQOfo]/Neha, the Novelty Dicemaker Voice Lines (Disco Elysium) [bSZCBFjQOfo]_chunk209.mp3
333
+ /home/ubuntu/respair/jpn/soshy/Japanese/saori/merged_vocals_chunk678.wav
334
+ /home/ubuntu/respair/jpn/moe/00163dc9/wav/00163dc9_1552.wav
335
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Кеннет Балмер - Страна которой нет на карте/Кенн_speaker_SPEAKER_01/Кенн_speaker_SPEAKER_01_chunk3664.mp3
336
+ /home/ubuntu/respair/data_cache/Final_Persian/آزاده رادمهر/f431b0f5-133a-406f-b8a6-cb42c507ca5d/f431b0f5-133a-406f-b8a6-cb42c507ca5d_chunk134.mp3
337
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Пол Бэттейджер - Ледяной ад/Пол _speaker_SPEAKER_01/Пол _speaker_SPEAKER_01_chunk564.mp3
338
+ /home/ubuntu/respair/data_cache/Final_Persian/راما قویدل/944535f5-bf56-441d-805a-a48f6fddfc60/944535f5-bf56-441d-805a-a48f6fddfc60_chunk95.mp3
339
+ /home/ubuntu/respair/data_cache/Final_Persian/رضا عمرانی/f2eb7ae4-7e24-45ba-8912-abe6273107bb/f2eb7ae4-7e24-45ba-8912-abe6273107bb_chunk430.mp3
340
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Unresolved: The Iran Threat [rdRcyieKBVE]/Unre_speaker_SPEAKER_08/Unre_speaker_SPEAKER_08_chunk156.wav
341
+ /home/ubuntu/respair/data_cache/Final_Persian/مرضیه رحماندوست/981c9d9c-0da8-449c-b826-5ba6ea45311d/981c9d9c-0da8-449c-b826-5ba6ea45311d_chunk135.mp3
342
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_15398.wav
343
+ /home/ubuntu/respair/data_cache/Final_Persian/یاسین ولی نژاد/a6df8917-be49-4e7f-a52a-3e69b65fdeb6/a6df8917-be49-4e7f-a52a-3e69b65fdeb6_chunk14_chunks/a6df8917-be49-4e7f-a52a-3e69b65fdeb6_chunk14_chunk_3.mp3
344
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/ليثيوم/ليثيوم_chunk735.mp3
345
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Анна Джейн_19/Анна Джейн_19_chunk8.mp3
346
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Laezel/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_002/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_002_chunk1108.mp3
347
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/frame_turner/MARCELO MIRACLES - 200.000.000 НА ОДЕЖДЕ, МАГАЗИН В ПАРИЖЕ, ПРОДАЖА ТРАВЫ И МИФЫ О ПСИХОЛОГАХ [C9d8v1bv8Sw]/MARC_speaker_SPEAKER_09/MARC_speaker_SPEAKER_09_chunk245.mp3
348
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Брэндон Сандерсон - Стоп-кадр/Брэн_speaker_SPEAKER_01/Брэн_speaker_SPEAKER_01_chunk353.mp3
349
+ /home/ubuntu/respair/data_cache/Final_Persian/یاشار ابراهیمی/e7181295-35ad-4953-a64d-de56a2cdd063/e7181295-35ad-4953-a64d-de56a2cdd063_chunk171.mp3
350
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_17443.wav
351
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/بره الدنيا/بره الدنيا_chunk386.mp3
352
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/shadow_heart/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_001/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_001_chunk837.mp3
353
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/رفقاء الليل/رفقاء الليل_chunk494.mp3
354
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/مكتوب/مكتوب_chunk468.mp3
355
+ /home/ubuntu/respair/jpn/moe/18460462/wav/18460462_2321.wav
356
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/ولك العودة/ولك العودة_chunk825.mp3
357
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Этногенез - Маруся 3_part_003/Этно_speaker_SPEAKER_02/Этно_speaker_SPEAKER_02_chunk1223.mp3
358
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/malady/Baldur's Gate 3 Voice Lines: The Narrator [BcdezgUEnLM]/Baldur's Gate 3 Voice Lines: The Narrator [BcdezgUEnLM]_chunk868.mp3
359
+ /home/ubuntu/respair/jpn/moe/8b6e7173/wav/8b6e7173_0246.wav
360
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/إليك قلبي/إليك قلبي_chunk818.mp3
361
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Артем Каменистый - Практикантка_part_003/Арте_speaker_SPEAKER_00/Арте_speaker_SPEAKER_00_chunk0.mp3
362
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/22khz/22khz/audiobook_rus_dataset_22khz_audio_982.wav
363
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/روح/روح_chunk867.mp3
364
+ /home/ubuntu/respair/data_cache/Final_Persian/پویا پورهمدانی/01d03ce5-d53e-4dad-bf21-78afca9f0183/01d03ce5-d53e-4dad-bf21-78afca9f0183_chunk361.mp3
365
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/fumika/fumika_cgss/fumika_card_200282/fumika_voice_200282_2_09.wav
366
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/مطلوب حبيب/مطلوب حبيب_chunk937.mp3
367
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Laezel/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_000/BG3 Voice Lines: Lae'zel [q-Z-9hfSirg]_part_000_chunk1623.mp3
368
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/shadow_heart/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_002/BG3 Voice Lines: Shadowheart (part 1) [u95hd47w8pM]_part_002_chunk616.mp3
369
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/أكوان/أكوان_chunk12.mp3
370
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_16020.wav
371
+ /home/ubuntu/respair/data_cache/Final_Persian/ونوس صفری/5e65388c-dd61-4f0c-a7c2-af511dc4b401/5e65388c-dd61-4f0c-a7c2-af511dc4b401_chunk0_chunks/5e65388c-dd61-4f0c-a7c2-af511dc4b401_chunk0_chunk_3.mp3
372
+ /home/ubuntu/respair/data_cache/Final_Persian/شهرزاد عالی/c332cbcf-3eee-4f81-a168-2f3c032dfa4f/c332cbcf-3eee-4f81-a168-2f3c032dfa4f_chunk142.mp3
373
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/sakurai_takahiro/Sakurai_Takahiro_02/Sakurai_Takahiro_02_chunk1544.wav
374
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Debate: Will AI Kill the Future of the Creative Arts? Jonathan Taplin vs. Rebecca Fiebrink [J5cz-v0j3D0]/Deba_speaker_SPEAKER_00/Deba_speaker_SPEAKER_00_chunk90.wav
375
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/usamin/usamin_mobamas/usamin_mobamasu_0007/usamin_mobamasu_0007_chunk15.wav
376
+ /home/ubuntu/respair/data_cache/Final_Persian/ساعد باقری/b240e95c-208a-4bb9-8e14-ef924efa9047/b240e95c-208a-4bb9-8e14-ef924efa9047_chunk431.mp3
377
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/009/S009_A_0055.wav
378
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Клиффорд Саймак - Кукла судьбы_part_002/Клиф_speaker_SPEAKER_04/Клиф_speaker_SPEAKER_04_chunk69.mp3
379
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/МАРКЕТОЛОГ. Личный бренд, продвижение в соцсетях и инфопродукты [b-nbsSigkKo]/МАРК_speaker_SPEAKER_01/МАРК_speaker_SPEAKER_01_chunk194.mp3
380
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_8349.wav
381
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_expresso/Ylacombe_Expresso_audio_10948_P3.wav
382
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/shinichiro_miki/Shinichiro_Miki_03/Shinichiro_Miki_03_chunk2008.wav
383
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Брайдер Юрий - Против течения/Брай_speaker_SPEAKER_00/Брай_speaker_SPEAKER_00_chunk92.mp3
384
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/Syuuko/Syuuko_Mobamas/Syuko Voice/【モバマス】[シンデレラドリーム]塩見周子【ボイス集】 - Niconico Video/【モバマス】[シンデレラドリーム]塩見周子【ボイス集】 - Niconico Video_chunk12.wav
385
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/مجدولين/مجدولين_chunk361.mp3
386
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أهواك/أهواك_chunk1278.mp3
387
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Cuno Voice Lines (Disco Elysium) [GI3nSMhAHgU]/Cuno Voice Lines (Disco Elysium) [GI3nSMhAHgU]_chunk235.mp3
388
+ /home/ubuntu/respair/jpn/moe/bbd90363/wav/bbd90363_1058.wav
389
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_17836.wav
390
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Gale/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_003/BG3 Voice Lines��� Gale [CpasYgOyyl4]_part_003_chunk3147.mp3
391
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Анна Джейн_18/Анна Джейн_18_chunk25.mp3
392
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/horie_yui/Horie_Yui_03/Horie_Yui_03_chunk582.wav
393
+ /home/ubuntu/respair/jpn/moe/46d6bf83/wav/46d6bf83_0757.wav
394
+ /home/ubuntu/respair/jpn/moe/8b6e7173/wav/8b6e7173_0888.wav
395
+ /home/ubuntu/respair/data_cache/Final_Persian/مریم محبوب/7232519c-7ce3-45fb-9d4b-01fd9ddaef6e/7232519c-7ce3-45fb-9d4b-01fd9ddaef6e_chunk817.mp3
396
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Алексей Калугин - Лабиринт 3 - Мир без солнца_part_000/Алек_speaker_SPEAKER_00/Алек_speaker_SPEAKER_00_chunk67.mp3
397
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Logic Voice Lines (Disco Elysium) [01lD5K990NY]/Logic Voice Lines (Disco Elysium) [01lD5K990NY]_chunk675.mp3
398
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/002/S002_A_0633.wav
399
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/الكرسي الهزاز/الكرسي الهزاز_chunk1063.mp3
400
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Debate: We Should Expand the Supreme Court [eb6o-mTZm4o]/Deba_speaker_SPEAKER_02/Deba_speaker_SPEAKER_02_chunk160.wav
401
+ /home/ubuntu/respair/data_cache/Final_Persian/مهرداد محمدپور/7b29e20a-1fda-4c2c-897d-31024969a2ef/7b29e20a-1fda-4c2c-897d-31024969a2ef_chunk23.mp3
402
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/Kanade/Kanade_Events_and_Card/Kanade_Events/Monochrome_lily/Monochrome_lily_chunk245.wav
403
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Kim Kitsuragi Voice Lines (Disco Elyisum) [c5qHI57fkFE]_part_003/Kim Kitsuragi Voice Lines (Disco Elyisum) [c5qHI57fkFE]_part_003_chunk180.mp3
404
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/الخيط الرفيع/الخيط الرفيع_chunk1325.mp3
405
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Egg Head Voice Lines (Disco Elysium) [jpEuRSw-R0U]/Egg Head Voice Lines (Disco Elysium) [jpEuRSw-R0U]_chunk76.mp3
406
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Open to Debate Mock Trial: Is Trump Guilty in the January 6th Case? Lanny Davis vs Sara Azari [rN5klE6Ul_A]/Open_speaker_SPEAKER_00/Open_speaker_SPEAKER_00_chunk116.wav
407
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Джек Андерсон - Игра в лево-право/Джек_speaker_SPEAKER_04/Джек_speaker_SPEAKER_04_chunk1898.mp3
408
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_1783.wav
409
+ /home/ubuntu/respair/jpn/moe/00163dc9/wav/00163dc9_0264.wav
410
+ /home/ubuntu/respair/data_cache/Final_Persian/رضا عمرانی/6809b0ed-aa4f-4ff2-a3e1-78825d4a7146/6809b0ed-aa4f-4ff2-a3e1-78825d4a7146_chunk325.mp3
411
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Сарко Де Рази - Украденный свет/Сарк_speaker_SPEAKER_00/Сарк_speaker_SPEAKER_00_chunk405.mp3
412
+ /home/ubuntu/respair/jpn/moe/95c3bdd8/wav/95c3bdd8_2219.wav
413
+ /home/ubuntu/respair/data_cache/Final_Persian/تینا میرکریمی/059a1c87-6624-4f75-98c8-f9f92c83fd9c/059a1c87-6624-4f75-98c8-f9f92c83fd9c_chunk238.mp3
414
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Парфенов - о преемнике, Серебренникове и мате ⧸ вДудь [t6i4ElZV1K0]/Парф_speaker_SPEAKER_04/Парф_speaker_SPEAKER_04_chunk83.mp3
415
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/عشقني عفريت من الجن/عشقني عفريت من الجن_chunk1010.mp3
416
+ /home/ubuntu/respair/data_cache/Final_Persian/محسن زرآبادی پور/e1013cd9-b7fc-4373-9060-404b3fff1e32/e1013cd9-b7fc-4373-9060-404b3fff1e32_chunk161.mp3
417
+ /home/ubuntu/respair/data_cache/Final_Persian/احسان چریکی/1cd3f6cb-2936-42dc-a5f9-f90591f00e96/1cd3f6cb-2936-42dc-a5f9-f90591f00e96_chunk85.mp3
418
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Gale/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_000/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_000_chunk1669.mp3
419
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/shinichiro_miki/Shinichiro_Miki__01/Shinichiro_Miki__01_chunk863.wav
420
+ /home/ubuntu/respair/data_cache/Final_Persian/ساعد باقری/b842c75e-7251-441c-852d-fc8cc5c20558/b842c75e-7251-441c-852d-fc8cc5c20558_chunk800.mp3
421
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Этногенез - Маруся 3_part_003/Этно_speaker_SPEAKER_02/Этно_speaker_SPEAKER_02_chunk1007.mp3
422
+ /home/ubuntu/respair/data_cache/Final_Persian/ونوس صفری/ddcbcb63-4285-44d9-b305-700e86ae98a6/ddcbcb63-4285-44d9-b305-700e86ae98a6_chunk14_chunks/ddcbcb63-4285-44d9-b305-700e86ae98a6_chunk14_chunk_5.mp3
423
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Should Congress Stop Funding the War in Ukraine? [rdtCyiKHtqE]/Shou_speaker_SPEAKER_01/Shou_speaker_SPEAKER_01_chunk12.wav
424
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/МРАКОБЕСИЕ В ПСИХИАТРИИ. Ипохондрия, расстановки по Хеллингеру и холотропное дыхание [T-oKbZtgRN8]/МРАК_speaker_SPEAKER_01/МРАК_speaker_SPEAKER_01_chunk790.mp3
425
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/frame_turner/MORGENSHTERN ‒ ЛИЗА, ГАЛЛЮЦИНАЦИИ, ДЕТСКИЕ ТРАВМЫ, ПРИЧИНА РАЗВОДА И СЕКРЕТ УСПЕХА [g1nVX1oPxHE]/MORG_speaker_SPEAKER_02/MORG_speaker_SPEAKER_02_chunk2015.mp3
426
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/ذاكرة الجسد/ذاكرة الجسد_chunk526.mp3
427
+ /home/ubuntu/respair/jpn/soshy/Japanese/imas_split/mio/mio_honda_cgss/mio_honda_card_301000/mio_honda_voice_301000_1_12.wav
428
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/ФАРМАЦЕВТ. Что подмешивают в БАДы? Вакцина от коронавируса [IYPGDU8Am1I]/ФАРМ_speaker_SPEAKER_01/ФАРМ_speaker_SPEAKER_01_chunk21.mp3
429
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/Жизнь с БИПОЛЯРНЫМ РАССТРОЙСТВОМ. Депрессии, гипомании и смешанные фазы [aP1S8MK7lrI]/Жизн_speaker_SPEAKER_03/Жизн_speaker_SPEAKER_03_chunk199.mp3
430
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_podcast/Ylacombe_podcast_audio_183.wav
431
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_podcast/Ylacombe_podcast_audio_810_P3.wav
432
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_expresso/Ylacombe_Expresso_audio_1731_P3.wav
433
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Esprit de Corps Voice Lines (Disco Elysium) [Dnzg0hMiPls]/Esprit de Corps Voice Lines (Disco Elysium) [Dnzg0hMiPls]_chunk439.mp3
434
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Анна Джейн_35/Анна Джейн_35_chunk203.mp3
435
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Fast Fashion: Shop or Stop? [GluaE-_C0-Q]/Fast_speaker_SPEAKER_03/Fast_speaker_SPEAKER_03_chunk109.wav
436
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/001/S001_C_0288.wav
437
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Gale/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_001/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_001_chunk2855.mp3
438
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/011/S011_A_3111.wav
439
+ /home/ubuntu/respair/jpn/soshy/Japanese/monogatari/monogatari_voices/monogatari_split/sakurai_takahiro/Sakurai_Takahiro_02/Sakurai_Takahiro_02_chunk1844.wav
440
+ /home/ubuntu/respair/jpn/moe/917feebd/wav/917feebd_2407.wav
441
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/#Debate: Is Florida Eating New York's Lunch? Bill de Blasio vs. Reihan Salam [Poj2dDr3n-M]/#Deb_speaker_SPEAKER_07/#Deb_speaker_SPEAKER_07_chunk111.wav
442
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_podcast/Ylacombe_podcast_audio_2207_P2.wav
443
+ /home/ubuntu/respair/data_cache/Final_Persian/حسن آزادی/ab1eea53-b347-42c1-8663-a4691bd04a1a/ab1eea53-b347-42c1-8663-a4691bd04a1a_chunk567.mp3
444
+ /home/ubuntu/respair/jpn/soshy/Japanese/sakura_moyu/03/03013290.wav
445
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/malady/Baldur's Gate 3 Voice Lines: The Narrator [BcdezgUEnLM]/Baldur's Gate 3 Voice Lines: The Narrator [BcdezgUEnLM]_chunk1527.mp3
446
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Limbic System Voice Lines (Disco Elysium) [ug5DR5ylSPc]/Limbic System Voice Lines (Disco Elysium) [ug5DR5ylSPc]_chunk302.mp3
447
+ /home/ubuntu/respair/jpn/moe/9febd2ae/wav/9febd2ae_1198.wav
448
+ /home/ubuntu/respair/data_cache/Final_Persian/محمد امرایی/a4c4b25a-d6b2-48e2-af9f-c3606a69eae0/a4c4b25a-d6b2-48e2-af9f-c3606a69eae0_chunk382.mp3
449
+ /home/ubuntu/respair/data_cache/Final_Persian/ساعد باقری/8ed4d9cb-ebf4-4f5e-8960-2024091c1b55/8ed4d9cb-ebf4-4f5e-8960-2024091c1b55_chunk482.mp3
450
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/هكذا تكلم الذئب/هكذا تكلم الذئب_chunk1004.mp3
451
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/ليتنا لم نلتق/ليتنا لم نلتق_chunk1035.mp3
452
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/عشق في بلاد الجليد/عشق في بلاد الجليد_chunk585.mp3
453
+ /home/ubuntu/respair/jpn/moe/ee093a4f/wav/ee093a4f_0084.wav
454
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/inga/inga_clean/Glava_02/Glava_02_chunk273.mp3
455
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/003/S003_E_0015.wav
456
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/sychev/Жизнь с БИПОЛЯРНЫМ РАССТРОЙСТВОМ 2 типа. Урбанистика, TEDx и психоанализ [umei-N44qqI]/Жизн_speaker_SPEAKER_06/Жизн_speaker_SPEAKER_06_chunk388.mp3
457
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/شفاة صامتة/شفاة صامتة_chunk1274.mp3
458
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/ylac/ylacombe_podcast/Ylacombe_podcast_audio_5478.wav
459
+ /home/ubuntu/respair/data_cache/Final_Persian/منصور ضابطیان/e15de6bb-d0c4-4b73-a72a-bfd153b92c9d/e15de6bb-d0c4-4b73-a72a-bfd153b92c9d_chunk42.mp3
460
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أنا سنية و أنت شيعي/أنا سنية و أنت شيعي_chunk887.mp3
461
+ /home/ubuntu/respair/jpn/moe/4e2f4ba6/wav/4e2f4ba6_1288.wav
462
+ /home/ubuntu/respair/data_cache/Final_Persian/تینا میرکریمی/aebfec67-14a2-4672-9f31-27cd3b7febc4/aebfec67-14a2-4672-9f31-27cd3b7febc4_chunk178.mp3
463
+ /home/ubuntu/respair/jpn/moe/ad28b91b/wav/ad28b91b_1167.wav
464
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Cuno Voice Lines (Disco Elysium) [GI3nSMhAHgU]/Cuno Voice Lines (Disco Elysium) [GI3nSMhAHgU]_chunk1663.mp3
465
+ /home/ubuntu/respair/data_cache/Final_Persian/احسان چریکی/ead295e2-d936-4425-89db-150aa5325763/ead295e2-d936-4425-89db-150aa5325763_chunk493.mp3
466
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/003/S003_C_0011.wav
467
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/All Vicious Mockery Insults [QhA1NwgnFN8]/All Vicious Mockery Insults [QhA1NwgnFN8]_chunk1488.mp3
468
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/بنت الباشا/بنت الباشا_chunk726.mp3
469
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/BG3 Voice Lines: Jaheira [r7HxfsGG0zo]/BG3 Voice Lines: Jaheira [r7HxfsGG0zo]_chunk1383.mp3
470
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/debate_chunks/Will Kamala Harris or Donald Trump be Better for America? [hfoSRFGNykQ]/Will_speaker_SPEAKER_04/Will_speaker_SPEAKER_04_chunk50.wav
471
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/مريض لن انساه/مريض لن انساه_chunk1308.mp3
472
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Кейт Лаумер - Король города/Кейт_speaker_SPEAKER_02/Кейт_speaker_SPEAKER_02_chunk931.mp3
473
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/الحصان الشارد/الحصان الشارد_chunk555.mp3
474
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/22khz/22khz/audiobook_rus_dataset_22khz_audio_16379.wav
475
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Gale/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_000/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_000_chunk374.mp3
476
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Сергей и Марина Дьяченко - Vita Nostra_part_000/Серг_speaker_SPEAKER_01/Серг_speaker_SPEAKER_01_chunk21.mp3
477
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/BG3 Voice Lines: Minsc [5wO9k1rgRcY]/BG3 Voice Lines: Minsc [5wO9k1rgRcY]_chunk5377.mp3
478
+ /home/ubuntu/respair/data_cache/Final_Rusiki/wth_ids/22khz/22khz/audiobook_rus_dataset_22khz_audio_304.wav
479
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/رقصة المرمر/رقصة المرمر_chunk738.mp3
480
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_18630.wav
481
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/ظلال الكولوسيوم/ظلال الكولوسيوم_chunk619.mp3
482
+ /home/ubuntu/respair/data_cache/English_Final/with_ids/Ani_speech/audio_12749.wav
483
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/أرجوك أعطني هذا الدواء/أرجوك أعطني هذا الدواء_chunk367.mp3
484
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/أنا في أنتظبارك/أنا في أنتظبارك_chunk448.mp3
485
+ /home/ubuntu/respair/data_cache/Final_Persian/حامد فعال/487218ea-d36f-421a-b03d-898cbc3b1bc8/487218ea-d36f-421a-b03d-898cbc3b1bc8_chunk141.mp3
486
+ /home/ubuntu/respair/data_cache/Final_Persian/امیرمحمد صمصامی/92dc1a19-f918-40a5-84ce-ae0ba60aa1e5/92dc1a19-f918-40a5-84ce-ae0ba60aa1e5_chunk229.mp3
487
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/تحت سقف واحد/تحت سقف واحد_chunk1215.mp3
488
+ /home/ubuntu/respair/data_cache/Final_Persian/محمدرضا علی اکبری/f6e7c8b3-f5be-48cb-8a08-34691ab81af6/f6e7c8b3-f5be-48cb-8a08-34691ab81af6_chunk937.mp3
489
+ /home/ubuntu/respair/jpn/soshy/Japanese/tsujido/vo/003/S003_A_0346.wav
490
+ /home/ubuntu/respair/data_cache/Final_Persian/یاسر دعاگو/6f570bc1-d61d-4bee-ad9c-602c6197091c/6f570bc1-d61d-4bee-ad9c-602c6197091c_chunk408.mp3
491
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/انتحار حمار/انتحار حمار_chunk1353.mp3
492
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/وصال الروح/وصال الروح_chunk241.mp3
493
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Кеннет Балмер - Страна которой нет на карте/Кенн_speaker_SPEAKER_01/Кенн_speaker_SPEAKER_01_chunk398.mp3
494
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/النساء لهن أسنان بيضاء/النساء لهن أسنان بيضاء_chunk683.mp3
495
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/audiobooks_25P/Роберт Шекли - Носитель Инфекции/Робе_speaker_SPEAKER_00/Робе_speaker_SPEAKER_00_chunk742.mp3
496
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/BD3/BG3_Rest/Gale/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_001/BG3 Voice Lines: Gale [CpasYgOyyl4]_part_001_chunk2653.mp3
497
+ /home/ubuntu/respair/data_cache/English_Final/no_ids/HF_temp/games/Disco/Ancient Reptilian Brain Voice Lines (Disco Elysium) [MOYMRFmEqcg]/Ancient Reptilian Brain Voice Lines (Disco Elysium) [MOYMRFmEqcg]_chunk82.mp3
498
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم القصص/٣٣ بلونة حب/٣٣ بلونة حب_chunk935.mp3
499
+ /home/ubuntu/respair/data_cache/Final_Rusiki/no_ids/Ruski_scraped_chunks/youtube/vedud/Невзоров – о Фараоне и ориентации Милонова ⧸ Alexandr Nevzorov's big interview [zcjKJ7FHDLM]/Невз_speaker_SPEAKER_03/Невз_speaker_SPEAKER_03_chunk730.mp3
500
+ /home/ubuntu/respair/data_cache/Arabic/Processed_chnks/مجموعة كتب صوتية Storytel قسم روايات رومانسية/م لك يوسف/م لك يوسف_chunk619.mp3
vocos/data/filelist2.train ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c912110b830ea4d3d5b7e6a6c3a5660d7c99a36cf2d5fb12033c8abce311b259
3
+ size 90047319
vocos/logs/lightning_logs/version_24/config.yaml ADDED
@@ -0,0 +1,152 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+ trainer:
4
+ logger:
5
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
6
+ init_args:
7
+ save_dir: logs/
8
+ name: lightning_logs
9
+ version: null
10
+ log_graph: false
11
+ default_hp_metric: true
12
+ prefix: ''
13
+ sub_dir: null
14
+ logdir: null
15
+ comment: ''
16
+ purge_step: null
17
+ max_queue: 10
18
+ flush_secs: 120
19
+ filename_suffix: ''
20
+ write_to_disk: true
21
+ comet_config:
22
+ disabled: true
23
+ enable_checkpointing: true
24
+ callbacks:
25
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
26
+ init_args:
27
+ logging_interval: null
28
+ log_momentum: false
29
+ - class_path: pytorch_lightning.callbacks.ModelSummary
30
+ init_args:
31
+ max_depth: 2
32
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
33
+ init_args:
34
+ dirpath: null
35
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
36
+ monitor: val_loss
37
+ verbose: false
38
+ save_last: true
39
+ save_top_k: 3
40
+ save_weights_only: false
41
+ mode: min
42
+ auto_insert_metric_name: true
43
+ every_n_train_steps: null
44
+ train_time_interval: null
45
+ every_n_epochs: null
46
+ save_on_train_epoch_end: null
47
+ - class_path: vocos.helpers.GradNormCallback
48
+ default_root_dir: null
49
+ gradient_clip_val: null
50
+ gradient_clip_algorithm: null
51
+ num_nodes: 1
52
+ num_processes: null
53
+ devices:
54
+ - 0
55
+ - 1
56
+ gpus: null
57
+ auto_select_gpus: false
58
+ tpu_cores: null
59
+ ipus: null
60
+ enable_progress_bar: true
61
+ overfit_batches: 0.0
62
+ track_grad_norm: -1
63
+ check_val_every_n_epoch: 1
64
+ fast_dev_run: false
65
+ accumulate_grad_batches: null
66
+ max_epochs: null
67
+ min_epochs: null
68
+ max_steps: 2000000
69
+ min_steps: null
70
+ max_time: null
71
+ limit_train_batches: null
72
+ limit_val_batches: 50
73
+ limit_test_batches: null
74
+ limit_predict_batches: null
75
+ val_check_interval: null
76
+ log_every_n_steps: 100
77
+ accelerator: gpu
78
+ strategy: ddp
79
+ sync_batchnorm: false
80
+ precision: 32
81
+ enable_model_summary: true
82
+ num_sanity_val_steps: 2
83
+ resume_from_checkpoint: null
84
+ profiler: null
85
+ benchmark: null
86
+ deterministic: null
87
+ reload_dataloaders_every_n_epochs: 0
88
+ auto_lr_find: false
89
+ replace_sampler_ddp: true
90
+ detect_anomaly: false
91
+ auto_scale_batch_size: false
92
+ plugins: null
93
+ amp_backend: native
94
+ amp_level: null
95
+ move_metrics_to_cpu: false
96
+ multiple_trainloader_mode: max_size_cycle
97
+ inference_mode: true
98
+ model:
99
+ class_path: vocos.experiment.VocosExp
100
+ init_args:
101
+ feature_extractor:
102
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
103
+ init_args:
104
+ sample_rate: 44100
105
+ n_fft: 2048
106
+ hop_length: 512
107
+ win_length: 2048
108
+ n_mels: 128
109
+ padding: center
110
+ backbone:
111
+ class_path: vocos.models.VocosBackbone
112
+ init_args:
113
+ input_channels: 128
114
+ dim: 512
115
+ intermediate_dim: 1536
116
+ num_layers: 8
117
+ layer_scale_init_value: null
118
+ adanorm_num_embeddings: null
119
+ head:
120
+ class_path: vocos.heads.ISTFTHead
121
+ init_args:
122
+ dim: 512
123
+ n_fft: 2048
124
+ hop_length: 512
125
+ padding: center
126
+ sample_rate: 44100
127
+ initial_learning_rate: 0.0005
128
+ num_warmup_steps: 0
129
+ mel_loss_coeff: 45.0
130
+ mrd_loss_coeff: 0.1
131
+ pretrain_mel_steps: 0
132
+ decay_mel_coeff: false
133
+ evaluate_utmos: true
134
+ evaluate_pesq: true
135
+ evaluate_periodicty: true
136
+ data:
137
+ class_path: vocos.dataset.VocosDataModule
138
+ init_args:
139
+ train_params:
140
+ filelist_path: /home/ubuntu/vocos/data/filelist.train
141
+ sampling_rate: 44100
142
+ num_samples: 65536
143
+ batch_size: 58
144
+ num_workers: 8
145
+ val_params:
146
+ filelist_path: /home/ubuntu/vocos/data/filelist.val
147
+ sampling_rate: 44100
148
+ num_samples: 65536
149
+ batch_size: 16
150
+ num_workers: 8
151
+ optimizer: null
152
+ lr_scheduler: null
vocos/logs/lightning_logs/version_24/events.out.tfevents.1738102892.104-171-202-79 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd6ece1c3c30eafe201be7ae47f1915108cbcaa4c5c86e5ca9a3cc0d73d08d12
3
+ size 824
vocos/logs/lightning_logs/version_24/hparams.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ sample_rate: 44100
2
+ initial_learning_rate: 0.0005
3
+ num_warmup_steps: 0
4
+ mel_loss_coeff: 45.0
5
+ mrd_loss_coeff: 0.1
6
+ pretrain_mel_steps: 0
7
+ decay_mel_coeff: false
8
+ evaluate_utmos: true
9
+ evaluate_pesq: true
10
+ evaluate_periodicty: true
vocos/logs/lightning_logs/version_25/checkpoints/last.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b5b8380daa833cc2e56b967c6eeab7c3d4afb2839a0ebcbf0e69ce2ef0caf82
3
+ size 681716271
vocos/logs/lightning_logs/version_25/checkpoints/vocos_checkpoint_epoch=0_step=16634_val_loss=6.2461.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47ff3d96147a65ce0868c0d5314dd5a47a644aa4849cb05d64c619294c91de86
3
+ size 681715824
vocos/logs/lightning_logs/version_25/checkpoints/vocos_checkpoint_epoch=1_step=33268_val_loss=5.4846.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b5b8380daa833cc2e56b967c6eeab7c3d4afb2839a0ebcbf0e69ce2ef0caf82
3
+ size 681716271
vocos/logs/lightning_logs/version_25/config.yaml ADDED
@@ -0,0 +1,152 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+ trainer:
4
+ logger:
5
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
6
+ init_args:
7
+ save_dir: logs/
8
+ name: lightning_logs
9
+ version: null
10
+ log_graph: false
11
+ default_hp_metric: true
12
+ prefix: ''
13
+ sub_dir: null
14
+ logdir: null
15
+ comment: ''
16
+ purge_step: null
17
+ max_queue: 10
18
+ flush_secs: 120
19
+ filename_suffix: ''
20
+ write_to_disk: true
21
+ comet_config:
22
+ disabled: true
23
+ enable_checkpointing: true
24
+ callbacks:
25
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
26
+ init_args:
27
+ logging_interval: null
28
+ log_momentum: false
29
+ - class_path: pytorch_lightning.callbacks.ModelSummary
30
+ init_args:
31
+ max_depth: 2
32
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
33
+ init_args:
34
+ dirpath: null
35
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
36
+ monitor: val_loss
37
+ verbose: false
38
+ save_last: true
39
+ save_top_k: 3
40
+ save_weights_only: false
41
+ mode: min
42
+ auto_insert_metric_name: true
43
+ every_n_train_steps: null
44
+ train_time_interval: null
45
+ every_n_epochs: null
46
+ save_on_train_epoch_end: null
47
+ - class_path: vocos.helpers.GradNormCallback
48
+ default_root_dir: null
49
+ gradient_clip_val: null
50
+ gradient_clip_algorithm: null
51
+ num_nodes: 1
52
+ num_processes: null
53
+ devices:
54
+ - 0
55
+ - 1
56
+ gpus: null
57
+ auto_select_gpus: false
58
+ tpu_cores: null
59
+ ipus: null
60
+ enable_progress_bar: true
61
+ overfit_batches: 0.0
62
+ track_grad_norm: -1
63
+ check_val_every_n_epoch: 1
64
+ fast_dev_run: false
65
+ accumulate_grad_batches: null
66
+ max_epochs: null
67
+ min_epochs: null
68
+ max_steps: 2000000
69
+ min_steps: null
70
+ max_time: null
71
+ limit_train_batches: null
72
+ limit_val_batches: 50
73
+ limit_test_batches: null
74
+ limit_predict_batches: null
75
+ val_check_interval: null
76
+ log_every_n_steps: 100
77
+ accelerator: gpu
78
+ strategy: ddp
79
+ sync_batchnorm: false
80
+ precision: 32
81
+ enable_model_summary: true
82
+ num_sanity_val_steps: 2
83
+ resume_from_checkpoint: null
84
+ profiler: null
85
+ benchmark: null
86
+ deterministic: null
87
+ reload_dataloaders_every_n_epochs: 0
88
+ auto_lr_find: false
89
+ replace_sampler_ddp: true
90
+ detect_anomaly: false
91
+ auto_scale_batch_size: false
92
+ plugins: null
93
+ amp_backend: native
94
+ amp_level: null
95
+ move_metrics_to_cpu: false
96
+ multiple_trainloader_mode: max_size_cycle
97
+ inference_mode: true
98
+ model:
99
+ class_path: vocos.experiment.VocosExp
100
+ init_args:
101
+ feature_extractor:
102
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
103
+ init_args:
104
+ sample_rate: 44100
105
+ n_fft: 2048
106
+ hop_length: 512
107
+ win_length: 2048
108
+ n_mels: 128
109
+ padding: center
110
+ backbone:
111
+ class_path: vocos.models.VocosBackbone
112
+ init_args:
113
+ input_channels: 128
114
+ dim: 512
115
+ intermediate_dim: 1536
116
+ num_layers: 8
117
+ layer_scale_init_value: null
118
+ adanorm_num_embeddings: null
119
+ head:
120
+ class_path: vocos.heads.ISTFTHead
121
+ init_args:
122
+ dim: 512
123
+ n_fft: 2048
124
+ hop_length: 512
125
+ padding: center
126
+ sample_rate: 44100
127
+ initial_learning_rate: 0.0005
128
+ num_warmup_steps: 0
129
+ mel_loss_coeff: 45.0
130
+ mrd_loss_coeff: 0.1
131
+ pretrain_mel_steps: 0
132
+ decay_mel_coeff: false
133
+ evaluate_utmos: true
134
+ evaluate_pesq: true
135
+ evaluate_periodicty: true
136
+ data:
137
+ class_path: vocos.dataset.VocosDataModule
138
+ init_args:
139
+ train_params:
140
+ filelist_path: /home/ubuntu/vocos/data/filelist.train
141
+ sampling_rate: 44100
142
+ num_samples: 65536
143
+ batch_size: 58
144
+ num_workers: 8
145
+ val_params:
146
+ filelist_path: /home/ubuntu/vocos/data/filelist.val
147
+ sampling_rate: 44100
148
+ num_samples: 65536
149
+ batch_size: 16
150
+ num_workers: 8
151
+ optimizer: null
152
+ lr_scheduler: null
vocos/logs/lightning_logs/version_25/events.out.tfevents.1738103019.104-171-202-79 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f02506aa015b3928338d546f306e461971e99dcb31e66a265d647f63ce46295
3
+ size 7661756
vocos/logs/lightning_logs/version_25/hparams.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ sample_rate: 44100
2
+ initial_learning_rate: 0.0005
3
+ num_warmup_steps: 0
4
+ mel_loss_coeff: 45.0
5
+ mrd_loss_coeff: 0.1
6
+ pretrain_mel_steps: 0
7
+ decay_mel_coeff: false
8
+ evaluate_utmos: true
9
+ evaluate_pesq: true
10
+ evaluate_periodicty: true
vocos/logs/lightning_logs/version_26/checkpoints/last.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3720eb1e5ee6c1ba76d45f73b1661c0285705d570ed08ee78263fdd2bb16954
3
+ size 681715888
vocos/logs/lightning_logs/version_26/checkpoints/vocos_checkpoint_epoch=0_step=16634_val_loss=6.8451.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2499f5ade99900680bcc17d2e14987f91661c14cd925c7435c8fcd071323942a
3
+ size 681715824
vocos/logs/lightning_logs/version_26/config.yaml ADDED
@@ -0,0 +1,152 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+ trainer:
4
+ logger:
5
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
6
+ init_args:
7
+ save_dir: logs/
8
+ name: lightning_logs
9
+ version: null
10
+ log_graph: false
11
+ default_hp_metric: true
12
+ prefix: ''
13
+ sub_dir: null
14
+ logdir: null
15
+ comment: ''
16
+ purge_step: null
17
+ max_queue: 10
18
+ flush_secs: 120
19
+ filename_suffix: ''
20
+ write_to_disk: true
21
+ comet_config:
22
+ disabled: true
23
+ enable_checkpointing: true
24
+ callbacks:
25
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
26
+ init_args:
27
+ logging_interval: null
28
+ log_momentum: false
29
+ - class_path: pytorch_lightning.callbacks.ModelSummary
30
+ init_args:
31
+ max_depth: 2
32
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
33
+ init_args:
34
+ dirpath: null
35
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
36
+ monitor: val_loss
37
+ verbose: false
38
+ save_last: true
39
+ save_top_k: 3
40
+ save_weights_only: false
41
+ mode: min
42
+ auto_insert_metric_name: true
43
+ every_n_train_steps: null
44
+ train_time_interval: null
45
+ every_n_epochs: null
46
+ save_on_train_epoch_end: null
47
+ - class_path: vocos.helpers.GradNormCallback
48
+ default_root_dir: null
49
+ gradient_clip_val: null
50
+ gradient_clip_algorithm: null
51
+ num_nodes: 1
52
+ num_processes: null
53
+ devices:
54
+ - 0
55
+ - 1
56
+ gpus: null
57
+ auto_select_gpus: false
58
+ tpu_cores: null
59
+ ipus: null
60
+ enable_progress_bar: true
61
+ overfit_batches: 0.0
62
+ track_grad_norm: -1
63
+ check_val_every_n_epoch: 1
64
+ fast_dev_run: false
65
+ accumulate_grad_batches: null
66
+ max_epochs: null
67
+ min_epochs: null
68
+ max_steps: 2000000
69
+ min_steps: null
70
+ max_time: null
71
+ limit_train_batches: null
72
+ limit_val_batches: 50
73
+ limit_test_batches: null
74
+ limit_predict_batches: null
75
+ val_check_interval: null
76
+ log_every_n_steps: 100
77
+ accelerator: gpu
78
+ strategy: ddp
79
+ sync_batchnorm: false
80
+ precision: 32
81
+ enable_model_summary: true
82
+ num_sanity_val_steps: 2
83
+ resume_from_checkpoint: null
84
+ profiler: null
85
+ benchmark: null
86
+ deterministic: null
87
+ reload_dataloaders_every_n_epochs: 0
88
+ auto_lr_find: false
89
+ replace_sampler_ddp: true
90
+ detect_anomaly: false
91
+ auto_scale_batch_size: false
92
+ plugins: null
93
+ amp_backend: native
94
+ amp_level: null
95
+ move_metrics_to_cpu: false
96
+ multiple_trainloader_mode: max_size_cycle
97
+ inference_mode: true
98
+ model:
99
+ class_path: vocos.experiment.VocosExp
100
+ init_args:
101
+ feature_extractor:
102
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
103
+ init_args:
104
+ sample_rate: 44100
105
+ n_fft: 2048
106
+ hop_length: 512
107
+ win_length: 2048
108
+ n_mels: 128
109
+ padding: center
110
+ backbone:
111
+ class_path: vocos.models.VocosBackbone
112
+ init_args:
113
+ input_channels: 128
114
+ dim: 512
115
+ intermediate_dim: 1536
116
+ num_layers: 8
117
+ layer_scale_init_value: null
118
+ adanorm_num_embeddings: null
119
+ head:
120
+ class_path: vocos.heads.ISTFTHead
121
+ init_args:
122
+ dim: 512
123
+ n_fft: 2048
124
+ hop_length: 512
125
+ padding: center
126
+ sample_rate: 44100
127
+ initial_learning_rate: 0.0005
128
+ num_warmup_steps: 0
129
+ mel_loss_coeff: 45.0
130
+ mrd_loss_coeff: 0.1
131
+ pretrain_mel_steps: 0
132
+ decay_mel_coeff: false
133
+ evaluate_utmos: true
134
+ evaluate_pesq: true
135
+ evaluate_periodicty: true
136
+ data:
137
+ class_path: vocos.dataset.VocosDataModule
138
+ init_args:
139
+ train_params:
140
+ filelist_path: /home/ubuntu/vocos/data/filelist.train
141
+ sampling_rate: 44100
142
+ num_samples: 65536
143
+ batch_size: 58
144
+ num_workers: 8
145
+ val_params:
146
+ filelist_path: /home/ubuntu/vocos/data/filelist.val
147
+ sampling_rate: 44100
148
+ num_samples: 65536
149
+ batch_size: 16
150
+ num_workers: 8
151
+ optimizer: null
152
+ lr_scheduler: null
vocos/logs/lightning_logs/version_26/events.out.tfevents.1738103077.104-171-202-79 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48c17ee2d5df22160ac1d62a41c9db5957f60652875309e4b5f315bf25c0452b
3
+ size 5746663
vocos/logs/lightning_logs/version_26/hparams.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ sample_rate: 44100
2
+ initial_learning_rate: 0.0005
3
+ num_warmup_steps: 0
4
+ mel_loss_coeff: 45.0
5
+ mrd_loss_coeff: 0.1
6
+ pretrain_mel_steps: 0
7
+ decay_mel_coeff: false
8
+ evaluate_utmos: true
9
+ evaluate_pesq: true
10
+ evaluate_periodicty: true
vocos/logs/lightning_logs/version_27/checkpoints/last.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9c52539e953c4675d8f68db881f7c7f3afd6abeecc9932b288c71adf3ab487a
3
+ size 681715888
vocos/logs/lightning_logs/version_27/checkpoints/vocos_checkpoint_epoch=0_step=16634_val_loss=6.0317.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3196e7caa913048385c6806a8fce5b7ee675a77bdacc83c3b84f50a9d557581e
3
+ size 681715824
vocos/logs/lightning_logs/version_27/config.yaml ADDED
@@ -0,0 +1,152 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+ trainer:
4
+ logger:
5
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
6
+ init_args:
7
+ save_dir: logs/
8
+ name: lightning_logs
9
+ version: null
10
+ log_graph: false
11
+ default_hp_metric: true
12
+ prefix: ''
13
+ sub_dir: null
14
+ logdir: null
15
+ comment: ''
16
+ purge_step: null
17
+ max_queue: 10
18
+ flush_secs: 120
19
+ filename_suffix: ''
20
+ write_to_disk: true
21
+ comet_config:
22
+ disabled: true
23
+ enable_checkpointing: true
24
+ callbacks:
25
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
26
+ init_args:
27
+ logging_interval: null
28
+ log_momentum: false
29
+ - class_path: pytorch_lightning.callbacks.ModelSummary
30
+ init_args:
31
+ max_depth: 2
32
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
33
+ init_args:
34
+ dirpath: null
35
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
36
+ monitor: val_loss
37
+ verbose: false
38
+ save_last: true
39
+ save_top_k: 3
40
+ save_weights_only: false
41
+ mode: min
42
+ auto_insert_metric_name: true
43
+ every_n_train_steps: null
44
+ train_time_interval: null
45
+ every_n_epochs: null
46
+ save_on_train_epoch_end: null
47
+ - class_path: vocos.helpers.GradNormCallback
48
+ default_root_dir: null
49
+ gradient_clip_val: null
50
+ gradient_clip_algorithm: null
51
+ num_nodes: 1
52
+ num_processes: null
53
+ devices:
54
+ - 0
55
+ - 1
56
+ gpus: null
57
+ auto_select_gpus: false
58
+ tpu_cores: null
59
+ ipus: null
60
+ enable_progress_bar: true
61
+ overfit_batches: 0.0
62
+ track_grad_norm: -1
63
+ check_val_every_n_epoch: 1
64
+ fast_dev_run: false
65
+ accumulate_grad_batches: null
66
+ max_epochs: null
67
+ min_epochs: null
68
+ max_steps: 2000000
69
+ min_steps: null
70
+ max_time: null
71
+ limit_train_batches: null
72
+ limit_val_batches: 50
73
+ limit_test_batches: null
74
+ limit_predict_batches: null
75
+ val_check_interval: null
76
+ log_every_n_steps: 100
77
+ accelerator: gpu
78
+ strategy: ddp
79
+ sync_batchnorm: false
80
+ precision: 32
81
+ enable_model_summary: true
82
+ num_sanity_val_steps: 2
83
+ resume_from_checkpoint: null
84
+ profiler: null
85
+ benchmark: null
86
+ deterministic: null
87
+ reload_dataloaders_every_n_epochs: 0
88
+ auto_lr_find: false
89
+ replace_sampler_ddp: true
90
+ detect_anomaly: false
91
+ auto_scale_batch_size: false
92
+ plugins: null
93
+ amp_backend: native
94
+ amp_level: null
95
+ move_metrics_to_cpu: false
96
+ multiple_trainloader_mode: max_size_cycle
97
+ inference_mode: true
98
+ model:
99
+ class_path: vocos.experiment.VocosExp
100
+ init_args:
101
+ feature_extractor:
102
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
103
+ init_args:
104
+ sample_rate: 44100
105
+ n_fft: 2048
106
+ hop_length: 512
107
+ win_length: 2048
108
+ n_mels: 128
109
+ padding: center
110
+ backbone:
111
+ class_path: vocos.models.VocosBackbone
112
+ init_args:
113
+ input_channels: 128
114
+ dim: 512
115
+ intermediate_dim: 1536
116
+ num_layers: 8
117
+ layer_scale_init_value: null
118
+ adanorm_num_embeddings: null
119
+ head:
120
+ class_path: vocos.heads.ISTFTHead
121
+ init_args:
122
+ dim: 512
123
+ n_fft: 2048
124
+ hop_length: 512
125
+ padding: center
126
+ sample_rate: 44100
127
+ initial_learning_rate: 0.0005
128
+ num_warmup_steps: 0
129
+ mel_loss_coeff: 45.0
130
+ mrd_loss_coeff: 0.1
131
+ pretrain_mel_steps: 0
132
+ decay_mel_coeff: false
133
+ evaluate_utmos: true
134
+ evaluate_pesq: true
135
+ evaluate_periodicty: true
136
+ data:
137
+ class_path: vocos.dataset.VocosDataModule
138
+ init_args:
139
+ train_params:
140
+ filelist_path: /home/ubuntu/vocos/data/filelist.train
141
+ sampling_rate: 44100
142
+ num_samples: 65536
143
+ batch_size: 58
144
+ num_workers: 8
145
+ val_params:
146
+ filelist_path: /home/ubuntu/vocos/data/filelist.val
147
+ sampling_rate: 44100
148
+ num_samples: 65536
149
+ batch_size: 16
150
+ num_workers: 8
151
+ optimizer: null
152
+ lr_scheduler: null
vocos/logs/lightning_logs/version_27/events.out.tfevents.1738146591.104-171-202-79 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57d65dca6e2d50879800973f412ed4da5c334ebfbd70f475dea1988880d1d01e
3
+ size 4136929
vocos/logs/lightning_logs/version_27/hparams.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ sample_rate: 44100
2
+ initial_learning_rate: 0.0005
3
+ num_warmup_steps: 0
4
+ mel_loss_coeff: 45.0
5
+ mrd_loss_coeff: 0.1
6
+ pretrain_mel_steps: 0
7
+ decay_mel_coeff: false
8
+ evaluate_utmos: true
9
+ evaluate_pesq: true
10
+ evaluate_periodicty: true
vocos/logs/lightning_logs/version_28/config.yaml ADDED
@@ -0,0 +1,152 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # pytorch_lightning==1.8.6
2
+ seed_everything: 4444
3
+ trainer:
4
+ logger:
5
+ class_path: pytorch_lightning.loggers.TensorBoardLogger
6
+ init_args:
7
+ save_dir: logs/
8
+ name: lightning_logs
9
+ version: null
10
+ log_graph: false
11
+ default_hp_metric: true
12
+ prefix: ''
13
+ sub_dir: null
14
+ logdir: null
15
+ comment: ''
16
+ purge_step: null
17
+ max_queue: 10
18
+ flush_secs: 120
19
+ filename_suffix: ''
20
+ write_to_disk: true
21
+ comet_config:
22
+ disabled: true
23
+ enable_checkpointing: true
24
+ callbacks:
25
+ - class_path: pytorch_lightning.callbacks.LearningRateMonitor
26
+ init_args:
27
+ logging_interval: null
28
+ log_momentum: false
29
+ - class_path: pytorch_lightning.callbacks.ModelSummary
30
+ init_args:
31
+ max_depth: 2
32
+ - class_path: pytorch_lightning.callbacks.ModelCheckpoint
33
+ init_args:
34
+ dirpath: null
35
+ filename: vocos_checkpoint_{epoch}_{step}_{val_loss:.4f}
36
+ monitor: val_loss
37
+ verbose: false
38
+ save_last: true
39
+ save_top_k: 3
40
+ save_weights_only: false
41
+ mode: min
42
+ auto_insert_metric_name: true
43
+ every_n_train_steps: null
44
+ train_time_interval: null
45
+ every_n_epochs: null
46
+ save_on_train_epoch_end: null
47
+ - class_path: vocos.helpers.GradNormCallback
48
+ default_root_dir: null
49
+ gradient_clip_val: null
50
+ gradient_clip_algorithm: null
51
+ num_nodes: 1
52
+ num_processes: null
53
+ devices:
54
+ - 0
55
+ - 1
56
+ gpus: null
57
+ auto_select_gpus: false
58
+ tpu_cores: null
59
+ ipus: null
60
+ enable_progress_bar: true
61
+ overfit_batches: 0.0
62
+ track_grad_norm: -1
63
+ check_val_every_n_epoch: 1
64
+ fast_dev_run: false
65
+ accumulate_grad_batches: null
66
+ max_epochs: null
67
+ min_epochs: null
68
+ max_steps: 2000000
69
+ min_steps: null
70
+ max_time: null
71
+ limit_train_batches: null
72
+ limit_val_batches: 50
73
+ limit_test_batches: null
74
+ limit_predict_batches: null
75
+ val_check_interval: null
76
+ log_every_n_steps: 100
77
+ accelerator: gpu
78
+ strategy: ddp
79
+ sync_batchnorm: false
80
+ precision: 32
81
+ enable_model_summary: true
82
+ num_sanity_val_steps: 2
83
+ resume_from_checkpoint: null
84
+ profiler: null
85
+ benchmark: null
86
+ deterministic: null
87
+ reload_dataloaders_every_n_epochs: 0
88
+ auto_lr_find: false
89
+ replace_sampler_ddp: true
90
+ detect_anomaly: false
91
+ auto_scale_batch_size: false
92
+ plugins: null
93
+ amp_backend: native
94
+ amp_level: null
95
+ move_metrics_to_cpu: false
96
+ multiple_trainloader_mode: max_size_cycle
97
+ inference_mode: true
98
+ model:
99
+ class_path: vocos.experiment.VocosExp
100
+ init_args:
101
+ feature_extractor:
102
+ class_path: vocos.feature_extractors.MelSpectrogramFeatures
103
+ init_args:
104
+ sample_rate: 24000
105
+ n_fft: 2048
106
+ hop_length: 300
107
+ win_length: 1200
108
+ n_mels: 80
109
+ padding: center
110
+ backbone:
111
+ class_path: vocos.models.VocosBackbone
112
+ init_args:
113
+ input_channels: 80
114
+ dim: 512
115
+ intermediate_dim: 1536
116
+ num_layers: 8
117
+ layer_scale_init_value: null
118
+ adanorm_num_embeddings: null
119
+ head:
120
+ class_path: vocos.heads.ISTFTHead
121
+ init_args:
122
+ dim: 512
123
+ n_fft: 2048
124
+ hop_length: 300
125
+ padding: center
126
+ sample_rate: 24000
127
+ initial_learning_rate: 0.0005
128
+ num_warmup_steps: 0
129
+ mel_loss_coeff: 45.0
130
+ mrd_loss_coeff: 0.1
131
+ pretrain_mel_steps: 0
132
+ decay_mel_coeff: false
133
+ evaluate_utmos: true
134
+ evaluate_pesq: true
135
+ evaluate_periodicty: true
136
+ data:
137
+ class_path: vocos.dataset.VocosDataModule
138
+ init_args:
139
+ train_params:
140
+ filelist_path: /home/ubuntu/vocos/data/filelist2.train
141
+ sampling_rate: 24000
142
+ num_samples: 57600
143
+ batch_size: 64
144
+ num_workers: 8
145
+ val_params:
146
+ filelist_path: /home/ubuntu/vocos/data/filelist.val
147
+ sampling_rate: 24000
148
+ num_samples: 57600
149
+ batch_size: 16
150
+ num_workers: 8
151
+ optimizer: null
152
+ lr_scheduler: null
vocos/logs/lightning_logs/version_28/events.out.tfevents.1738155430.104-171-202-79 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b4a7316956f5ead36f26b752c57b4666029b303700a235499d5430b0e1075d2
3
+ size 698760
vocos/logs/lightning_logs/version_28/hparams.yaml ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ sample_rate: 24000
2
+ initial_learning_rate: 0.0005
3
+ num_warmup_steps: 0
4
+ mel_loss_coeff: 45.0
5
+ mrd_loss_coeff: 0.1
6
+ pretrain_mel_steps: 0
7
+ decay_mel_coeff: false
8
+ evaluate_utmos: true
9
+ evaluate_pesq: true
10
+ evaluate_periodicty: true
vocos/metrics/UTMOS.py ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+
3
+ import fairseq
4
+ import pytorch_lightning as pl
5
+ import requests
6
+ import torch
7
+ import torch.nn as nn
8
+ from tqdm import tqdm
9
+
10
+ UTMOS_CKPT_URL = "https://huggingface.co/spaces/sarulab-speech/UTMOS-demo/resolve/main/epoch%3D3-step%3D7459.ckpt"
11
+ WAV2VEC_URL = "https://huggingface.co/spaces/sarulab-speech/UTMOS-demo/resolve/main/wav2vec_small.pt"
12
+
13
+ """
14
+ UTMOS score, automatic Mean Opinion Score (MOS) prediction system,
15
+ adapted from https://huggingface.co/spaces/sarulab-speech/UTMOS-demo
16
+ """
17
+
18
+
19
class UTMOSScore:
    """Predicting score for each audio clip."""

    def __init__(self, device, ckpt_path="epoch=3-step=7459.ckpt"):
        """
        Load the scoring model from a checkpoint stored next to this module.

        Args:
            device: torch device the model (and every scored batch) is moved to.
            ckpt_path: checkpoint file name, resolved relative to this module's
                directory. It is fetched from ``UTMOS_CKPT_URL`` when the file
                does not exist yet.
        """
        self.device = device
        filepath = os.path.join(os.path.dirname(__file__), ckpt_path)
        if not os.path.exists(filepath):
            download_file(UTMOS_CKPT_URL, filepath)
        self.model = BaselineLightningModule.load_from_checkpoint(filepath).eval().to(device)

    def score(self, wavs: torch.Tensor) -> torch.Tensor:
        """
        Score one clip or a batch of clips.

        Args:
            wavs: audio waveform to be evaluated. When ``wavs.dim()`` is 1 or 2,
                the input is processed as a single audio clip (leading
                dimensions are added until it is 3-D). When ``wavs.dim()`` is 3
                the first dimension is used as the batch dimension.

        Returns:
            A CPU tensor holding one value per batch item: the model output
            averaged over dim 1, then rescaled with ``* 2 + 3``.

        Raises:
            ValueError: if ``wavs`` does not have 1, 2 or 3 dimensions.
        """
        n_dims = wavs.dim()
        if n_dims == 1:
            out_wavs = wavs.unsqueeze(0).unsqueeze(0)
        elif n_dims == 2:
            out_wavs = wavs.unsqueeze(0)
        elif n_dims == 3:
            out_wavs = wavs
        else:
            raise ValueError(f"Input tensor must have 1, 2 or 3 dimensions, got {n_dims}.")

        # The conditioning tensors below are created on self.device; the audio
        # has to live there too, otherwise a CPU input fails on a GPU model.
        out_wavs = out_wavs.to(self.device)
        bs = out_wavs.shape[0]
        batch = {
            "wav": out_wavs,
            "domains": torch.zeros(bs, dtype=torch.int).to(self.device),
            "judge_id": torch.ones(bs, dtype=torch.int).to(self.device) * 288,
        }
        with torch.no_grad():
            output = self.model(batch)

        return output.mean(dim=1).squeeze(1).cpu().detach() * 2 + 3
54
+
55
+
56
def download_file(url, filename, timeout=60):
    """
    Downloads a file from the given URL

    The payload is streamed into ``<filename>.part`` and only renamed to
    ``filename`` once the transfer has finished. Callers in this module use
    ``os.path.exists(filename)`` to decide whether a download is needed, so a
    half-written file must never appear under the final name.

    Args:
        url (str): The URL of the file to download.
        filename (str): The name to save the file as.
        timeout (float): Timeout in seconds handed to ``requests.get`` so a
            stalled connection does not hang forever.

    Raises:
        requests.HTTPError: if the server answers with an error status
            (via ``response.raise_for_status()``).
    """
    print(f"Downloading file {filename}...")
    tmp_path = f"{filename}.part"
    completed = False
    try:
        # Context managers close the connection, the file and the progress bar
        # even when the transfer fails midway.
        with requests.get(url, stream=True, timeout=timeout) as response:
            response.raise_for_status()
            total_size_in_bytes = int(response.headers.get("content-length", 0))
            with open(tmp_path, "wb") as f, tqdm(
                total=total_size_in_bytes, unit="iB", unit_scale=True
            ) as progress_bar:
                for chunk in response.iter_content(chunk_size=8192):
                    progress_bar.update(len(chunk))
                    f.write(chunk)
        os.replace(tmp_path, filename)
        completed = True
    finally:
        # Remove the partial file on any failure, including Ctrl-C.
        if not completed and os.path.exists(tmp_path):
            os.remove(tmp_path)
77
+
78
+
79
def load_ssl_model(ckpt_path="wav2vec_small.pt"):
    """
    Build the SSL feature extractor from a fairseq checkpoint.

    Args:
        ckpt_path: checkpoint file name, resolved relative to this module's
            directory; downloaded from ``WAV2VEC_URL`` when it is missing.

    Returns:
        An ``SSL_model`` wrapping the first model of the loaded ensemble, with
        its pretraining modules removed and an output dimension of 768.
    """
    ssl_out_dim = 768
    local_ckpt = os.path.join(os.path.dirname(__file__), ckpt_path)
    if not os.path.exists(local_ckpt):
        download_file(WAV2VEC_URL, local_ckpt)
    # Only the model list is needed; config and task are discarded.
    ensemble, _cfg, _task = fairseq.checkpoint_utils.load_model_ensemble_and_task([local_ckpt])
    encoder = ensemble[0]
    encoder.remove_pretraining_modules()
    return SSL_model(encoder, ssl_out_dim)
88
+
89
+
90
class BaselineLightningModule(pl.LightningModule):
    """Feature extractors followed by a listener conditioner and a projection head."""

    def __init__(self, cfg):
        super().__init__()
        self.cfg = cfg
        self.construct_model()
        self.save_hyperparameters()

    def construct_model(self):
        """Create ``feature_extractors`` and ``output_layers`` with fixed sizes."""
        extractors = [load_ssl_model(ckpt_path="wav2vec_small.pt"), DomainEmbedding(3, 128)]
        self.feature_extractors = nn.ModuleList(extractors)

        # The conditioner consumes every extractor's features concatenated.
        feature_dim = sum(extractor.get_output_dim() for extractor in self.feature_extractors)
        conditioner = LDConditioner(judge_dim=128, num_judges=3000, input_dim=feature_dim)
        projection = Projection(
            hidden_dim=2048,
            activation=torch.nn.ReLU(),
            range_clipping=False,
            input_dim=conditioner.get_output_dim(),
        )

        self.output_layers = nn.ModuleList([conditioner, projection])

    def forward(self, inputs):
        """
        Run all feature extractors on ``inputs`` and feed the merged feature
        dict through the output layers in order.

        Args:
            inputs: batch dict passed unchanged to every extractor and layer.

        Returns:
            The output of the last output layer.
        """
        features = {}
        for extractor in self.feature_extractors:
            features.update(extractor(inputs))

        hidden = features
        for layer in self.output_layers:
            hidden = layer(hidden, inputs)
        return hidden
118
+
119
+
120
class SSL_model(nn.Module):
    """Thin wrapper that exposes an SSL encoder as a dict-producing feature extractor."""

    def __init__(self, ssl_model, ssl_out_dim) -> None:
        super().__init__()
        self.ssl_model = ssl_model
        self.ssl_out_dim = ssl_out_dim

    def forward(self, batch):
        """
        Args:
            batch: dict whose ``"wav"`` entry is squeezed on dim 1 before being
                passed to the encoder (per the original comment this yields
                ``[batches, audio_len]``).

        Returns:
            ``{"ssl-feature": x}`` where ``x`` is the ``"x"`` entry of the
            encoder output (called with ``mask=False, features_only=True``).
        """
        waveform = batch["wav"].squeeze(1)  # [batches, audio_len]
        encoded = self.ssl_model(waveform, mask=False, features_only=True)
        return {"ssl-feature": encoded["x"]}

    def get_output_dim(self):
        """Return the feature dimension given at construction time."""
        return self.ssl_out_dim
134
+
135
+
136
class DomainEmbedding(nn.Module):
    """Look up a learned embedding vector for each domain id in a batch."""

    def __init__(self, n_domains, domain_dim) -> None:
        super().__init__()
        self.embedding = nn.Embedding(n_domains, domain_dim)
        self.output_dim = domain_dim

    def forward(self, batch):
        """Return ``{"domain-feature": ...}`` with the embeddings of ``batch["domains"]``."""
        domain_ids = batch["domains"]
        embedded = self.embedding(domain_ids)
        return {"domain-feature": embedded}

    def get_output_dim(self):
        """Return the embedding dimension."""
        return self.output_dim
147
+
148
+
149
class LDConditioner(nn.Module):
    """
    Conditions ssl output by listener embedding
    """

    def __init__(self, input_dim, judge_dim, num_judges=None):
        """
        Args:
            input_dim: size of the concatenated feature vector before the
                judge embedding is appended.
            judge_dim: size of the judge (listener) embedding.
            num_judges: number of rows in the judge embedding table; required.

        Raises:
            ValueError: if ``num_judges`` is not provided.
        """
        super().__init__()
        self.input_dim = input_dim
        self.judge_dim = judge_dim
        self.num_judges = num_judges
        # Explicit check instead of `assert`, which disappears under `python -O`.
        if num_judges is None:
            raise ValueError("num_judges must be provided")
        self.judge_embedding = nn.Embedding(num_judges, self.judge_dim)
        # concat [self.output_layer, phoneme features]

        self.decoder_rnn = nn.LSTM(
            input_size=self.input_dim + self.judge_dim,
            hidden_size=512,
            num_layers=1,
            batch_first=True,
            bidirectional=True,
        )  # linear?
        # Bidirectional LSTM: forward and backward hidden states are concatenated.
        self.out_dim = self.decoder_rnn.hidden_size * 2

    def get_output_dim(self):
        """Return the size of the last dimension produced by ``forward``."""
        return self.out_dim

    @staticmethod
    def _tile_over_frames(vector, frames):
        """Repeat a per-item ``vector`` along dim 1 to match ``frames.size(1)``."""
        return vector.unsqueeze(1).expand(-1, frames.size(1), -1)

    def forward(self, x, batch):
        """
        Concatenate the available features along dim 2 and run the LSTM.

        Args:
            x: feature dict. ``"ssl-feature"`` is required;
                ``"phoneme-feature"`` and ``"domain-feature"`` are optional and
                are repeated along dim 1 of the ssl feature before
                concatenation.
            batch: dict with a ``"judge_id"`` entry; when it is not ``None``
                the judge embedding is appended as well.

        Returns:
            The LSTM output sequence (final hidden and cell states are dropped).
        """
        judge_ids = batch["judge_id"]
        features = x["ssl-feature"]
        if "phoneme-feature" in x:
            features = torch.cat((features, self._tile_over_frames(x["phoneme-feature"], features)), dim=2)
        if "domain-feature" in x:
            features = torch.cat((features, self._tile_over_frames(x["domain-feature"], features)), dim=2)
        # Identity check: `!= None` on a tensor relies on comparison fallbacks.
        if judge_ids is not None:
            judge_feature = self.judge_embedding(judge_ids)
            features = torch.cat((features, self._tile_over_frames(judge_feature, features)), dim=2)
        decoder_output, _ = self.decoder_rnn(features)
        return decoder_output
198
+
199
+
200
class Projection(nn.Module):
    """Two-layer MLP head producing one value per position, optionally range-clipped."""

    def __init__(self, input_dim, hidden_dim, activation, range_clipping=False):
        super().__init__()
        self.range_clipping = range_clipping
        # Tanh is only instantiated when clipping is requested.
        if range_clipping:
            self.proj = nn.Tanh()

        self.output_dim = 1
        layers = [
            nn.Linear(input_dim, hidden_dim),
            activation,
            nn.Dropout(0.3),
            nn.Linear(hidden_dim, self.output_dim),
        ]
        self.net = nn.Sequential(*layers)

    def forward(self, x, batch):
        """
        Apply the MLP to ``x``; ``batch`` is accepted but unused here.

        Returns:
            The raw MLP output, or ``tanh(output) * 2.0 + 3`` when range
            clipping is enabled.
        """
        output = self.net(x)
        if not self.range_clipping:
            return output
        # range clipping
        return self.proj(output) * 2.0 + 3

    def get_output_dim(self):
        """Return the size of the last output dimension (always 1)."""
        return self.output_dim
vocos/metrics/__pycache__/UTMOS.cpython-311.pyc ADDED
Binary file (15 kB). View file
 
vocos/metrics/__pycache__/periodicity.cpython-311.pyc ADDED
Binary file (4.59 kB). View file
 
vocos/metrics/epoch=3-step=7459.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44c57e3e4135a243b43d2c82b6a693fcd56f15f9ad0e1eb2a8b31fdecd3a49b8
3
+ size 1238128841
vocos/metrics/periodicity.py ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import librosa
2
+ import numpy as np
3
+ import torch
4
+ import torchaudio
5
+ import torchcrepe
6
+ from torchcrepe.loudness import REF_DB
7
+
8
+ SILENCE_THRESHOLD = -60
9
+ UNVOICED_THRESHOLD = 0.21
10
+
11
+ """
12
+ Periodicity metrics adapted from https://github.com/descriptinc/cargan
13
+ """
14
+
15
+
16
def predict_pitch(
    audio: torch.Tensor, silence_threshold: float = SILENCE_THRESHOLD, unvoiced_treshold: float = UNVOICED_THRESHOLD
):
    """
    Estimate pitch and periodicity of ``audio`` with torchcrepe.

    The audio is handed to torchcrepe with ``sample_rate=torchcrepe.SAMPLE_RATE``,
    so it is treated as being sampled at that rate.

    Args:
        audio (Tensor): The audio waveform.
        silence_threshold (float): Frames whose mean perceptually weighted
            level falls below this value get periodicity 0.
        unvoiced_treshold (float): Frames with periodicity below this value
            get their pitch set to ``torchcrepe.UNVOICED``.

    Returns:
        pitch (ndarray): The predicted pitch.
        periodicity (ndarray): The predicted periodicity.
    """
    crepe_rate = torchcrepe.SAMPLE_RATE
    window_size = torchcrepe.WINDOW_SIZE

    # torchcrepe inference
    pitch_t, periodicity_t = torchcrepe.predict(
        audio,
        fmin=50.0,
        fmax=550,
        sample_rate=crepe_rate,
        model="full",
        return_periodicity=True,
        device=audio.device,
        pad=False,
    )
    pitch = pitch_t.cpu().numpy()
    periodicity = periodicity_t.cpu().numpy()

    # Power spectrogram used to find low-energy frames
    hop_length = crepe_rate // 100  # default CREPE
    analysis_window = torch.hann_window(window_size, device=audio.device)
    power_spec = torchaudio.functional.spectrogram(
        audio,
        window=analysis_window,
        n_fft=window_size,
        hop_length=hop_length,
        win_length=window_size,
        power=2,
        normalized=False,
        pad=0,
        center=False,
    )

    # Perceptual weighting, then average over axis 1
    # (presumably the frequency axis -- confirm against the input layout).
    bin_freqs = librosa.fft_frequencies(sr=crepe_rate, n_fft=window_size)
    weighted = librosa.perceptual_weighting(power_spec.cpu().numpy(), bin_freqs) - REF_DB
    is_silent = weighted.mean(axis=1) < silence_threshold

    # Silent frames are not periodic; weakly periodic frames are unvoiced.
    periodicity[is_silent] = 0
    pitch[periodicity < unvoiced_treshold] = torchcrepe.UNVOICED

    return pitch, periodicity
68
+
69
+
70
def calculate_periodicity_metrics(y: torch.Tensor, y_hat: torch.Tensor):
    """
    Calculates periodicity metrics for the predicted and true audio data.

    A frame counts as voiced when its pitch from ``predict_pitch`` is not NaN.

    Args:
        y (Tensor): The true audio data.
        y_hat (Tensor): The predicted audio data.

    Returns:
        periodicity_loss (float): RMSE between predicted and true periodicity,
            taken over axis 1 and then averaged.
        pitch_loss (float): RMSE of the pitch difference in cents over frames
            voiced in both signals; NaN when there is no such frame.
        f1 (float): The F1 score for voiced/unvoiced classification; 0.0 when
            there are no true positives.
    """
    true_pitch, true_periodicity = predict_pitch(y)
    pred_pitch, pred_periodicity = predict_pitch(y_hat)

    true_voiced = ~np.isnan(true_pitch)
    pred_voiced = ~np.isnan(pred_pitch)

    periodicity_loss = np.sqrt(((pred_periodicity - true_periodicity) ** 2).mean(axis=1)).mean()

    # Pitch RMSE is only defined where both signals are voiced.
    voiced = true_voiced & pred_voiced
    if voiced.any():
        difference_cents = 1200 * (np.log2(true_pitch[voiced]) - np.log2(pred_pitch[voiced]))
        pitch_loss = np.sqrt((difference_cents ** 2).mean())
    else:
        # Same NaN as before, without the mean-of-empty RuntimeWarning.
        pitch_loss = float("nan")

    # voiced/unvoiced confusion counts
    true_positives = int(voiced.sum())
    false_positives = int((~true_voiced & pred_voiced).sum())
    false_negatives = int((true_voiced & ~pred_voiced).sum())

    # F1 = 2TP / (2TP + FP + FN) equals 2PR / (P + R) wherever the latter is
    # defined, but is still 0 (not 0/0 = NaN) when there are no true positives.
    denominator = 2 * true_positives + false_positives + false_negatives
    f1 = 2 * true_positives / denominator if denominator > 0 else 0.0

    return periodicity_loss, pitch_loss, f1
vocos/metrics/wav2vec_small.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c66c39eaed1b79a61ea8573f71e08f6641ff156b6a8f458cfaab53877dfa4a26
3
+ size 950500491
vocos/notebooks/Bark+Vocos.ipynb ADDED
@@ -0,0 +1,264 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "nbformat": 4,
3
+ "nbformat_minor": 0,
4
+ "metadata": {
5
+ "colab": {
6
+ "private_outputs": true,
7
+ "provenance": [],
8
+ "gpuType": "T4",
9
+ "authorship_tag": "ABX9TyMC53IsYoVJIVijVzw3ADvX",
10
+ "include_colab_link": true
11
+ },
12
+ "kernelspec": {
13
+ "name": "python3",
14
+ "display_name": "Python 3"
15
+ },
16
+ "language_info": {
17
+ "name": "python"
18
+ },
19
+ "accelerator": "GPU"
20
+ },
21
+ "cells": [
22
+ {
23
+ "cell_type": "markdown",
24
+ "metadata": {
25
+ "id": "view-in-github",
26
+ "colab_type": "text"
27
+ },
28
+ "source": [
29
+ "<a href=\"https://colab.research.google.com/github/charactr-platform/vocos/blob/main/notebooks/Bark%2BVocos.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
30
+ ]
31
+ },
32
+ {
33
+ "cell_type": "markdown",
34
+ "source": [
35
+ "# Text-to-Audio Synthesis using Bark and Vocos"
36
+ ],
37
+ "metadata": {
38
+ "id": "NuRzVtHDZ_Gl"
39
+ }
40
+ },
41
+ {
42
+ "cell_type": "markdown",
43
+ "source": [
44
+ "In this notebook, we use [Bark](https://github.com/suno-ai/bark) generative model to turn a text prompt into EnCodec audio tokens. These tokens then go through two decoders, EnCodec and Vocos, to reconstruct the audio waveform. Compare the results to discover the differences in audio quality and characteristics."
45
+ ],
46
+ "metadata": {
47
+ "id": "zJFDte0daDAz"
48
+ }
49
+ },
50
+ {
51
+ "cell_type": "markdown",
52
+ "source": [
53
+ "Make sure you have Bark and Vocos installed:"
54
+ ],
55
+ "metadata": {
56
+ "id": "c9omqGDYnajY"
57
+ }
58
+ },
59
+ {
60
+ "cell_type": "code",
61
+ "source": [
62
+ "!pip install git+https://github.com/suno-ai/bark.git\n",
63
+ "!pip install vocos"
64
+ ],
65
+ "metadata": {
66
+ "id": "voH44g90NvtV"
67
+ },
68
+ "execution_count": null,
69
+ "outputs": []
70
+ },
71
+ {
72
+ "cell_type": "markdown",
73
+ "source": [
74
+ "Download and load Bark models"
75
+ ],
76
+ "metadata": {
77
+ "id": "s3cEjOIuj6tq"
78
+ }
79
+ },
80
+ {
81
+ "cell_type": "code",
82
+ "source": [
83
+ "from bark import preload_models\n",
84
+ "\n",
85
+ "preload_models()"
86
+ ],
87
+ "metadata": {
88
+ "id": "1H7XtXRMjxUM"
89
+ },
90
+ "execution_count": null,
91
+ "outputs": []
92
+ },
93
+ {
94
+ "cell_type": "markdown",
95
+ "source": [
96
+ "Download and load Vocos."
97
+ ],
98
+ "metadata": {
99
+ "id": "YO1m0dJ1j-F5"
100
+ }
101
+ },
102
+ {
103
+ "cell_type": "code",
104
+ "source": [
105
+ "from vocos import Vocos\n",
106
+ "import torch\n",
107
+ "\n",
108
+ "device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
109
+ "vocos = Vocos.from_pretrained(\"charactr/vocos-encodec-24khz\").to(device)"
110
+ ],
111
+ "metadata": {
112
+ "id": "COQYTDDFkBCq"
113
+ },
114
+ "execution_count": null,
115
+ "outputs": []
116
+ },
117
+ {
118
+ "cell_type": "markdown",
119
+ "source": [
120
+ "We are going to reuse `text_to_semantic` from Bark API, but to reconstruct audio waveform with a custom vocoder, we need to slightly redefine the API to return `fine_tokens`."
121
+ ],
122
+ "metadata": {
123
+ "id": "--RjqW0rk5JQ"
124
+ }
125
+ },
126
+ {
127
+ "cell_type": "code",
128
+ "execution_count": null,
129
+ "metadata": {
130
+ "id": "OiUsuN2DNl5S"
131
+ },
132
+ "outputs": [],
133
+ "source": [
134
+ "from typing import Optional, Union, Dict\n",
135
+ "\n",
136
+ "import numpy as np\n",
137
+ "from bark.generation import generate_coarse, generate_fine\n",
138
+ "\n",
139
+ "\n",
140
+ "def semantic_to_audio_tokens(\n",
141
+ " semantic_tokens: np.ndarray,\n",
142
+ " history_prompt: Optional[Union[Dict, str]] = None,\n",
143
+ " temp: float = 0.7,\n",
144
+ " silent: bool = False,\n",
145
+ " output_full: bool = False,\n",
146
+ "):\n",
147
+ " coarse_tokens = generate_coarse(\n",
148
+ " semantic_tokens, history_prompt=history_prompt, temp=temp, silent=silent, use_kv_caching=True\n",
149
+ " )\n",
150
+ " fine_tokens = generate_fine(coarse_tokens, history_prompt=history_prompt, temp=0.5)\n",
151
+ "\n",
152
+ " if output_full:\n",
153
+ " full_generation = {\n",
154
+ " \"semantic_prompt\": semantic_tokens,\n",
155
+ " \"coarse_prompt\": coarse_tokens,\n",
156
+ " \"fine_prompt\": fine_tokens,\n",
157
+ " }\n",
158
+ " return full_generation\n",
159
+ " return fine_tokens"
160
+ ]
161
+ },
162
+ {
163
+ "cell_type": "markdown",
164
+ "source": [
165
+ "Let's create a text prompt and generate audio tokens:"
166
+ ],
167
+ "metadata": {
168
+ "id": "Cv8KCzXlmoF9"
169
+ }
170
+ },
171
+ {
172
+ "cell_type": "code",
173
+ "source": [
174
+ "from bark import text_to_semantic\n",
175
+ "\n",
176
+ "history_prompt = None\n",
177
+ "text_prompt = \"So, you've heard about neural vocoding? [laughs] We've been messing around with this new model called Vocos.\"\n",
178
+ "semantic_tokens = text_to_semantic(text_prompt, history_prompt=history_prompt, temp=0.7, silent=False,)\n",
179
+ "audio_tokens = semantic_to_audio_tokens(\n",
180
+ " semantic_tokens, history_prompt=history_prompt, temp=0.7, silent=False, output_full=False,\n",
181
+ ")"
182
+ ],
183
+ "metadata": {
184
+ "id": "pDmSTutoOH_G"
185
+ },
186
+ "execution_count": null,
187
+ "outputs": []
188
+ },
189
+ {
190
+ "cell_type": "markdown",
191
+ "source": [
192
+ "Reconstruct audio waveform with EnCodec:"
193
+ ],
194
+ "metadata": {
195
+ "id": "UYMzI8svTNqI"
196
+ }
197
+ },
198
+ {
199
+ "cell_type": "code",
200
+ "source": [
201
+ "from bark.generation import codec_decode\n",
202
+ "from IPython.display import Audio\n",
203
+ "\n",
204
+ "encodec_output = codec_decode(audio_tokens)\n",
205
+ "\n",
206
+ "import torchaudio\n",
207
+ "# Upsample to 44100 Hz for better reproduction on audio hardware\n",
208
+ "encodec_output = torchaudio.functional.resample(torch.from_numpy(encodec_output), orig_freq=24000, new_freq=44100)\n",
209
+ "Audio(encodec_output, rate=44100)"
210
+ ],
211
+ "metadata": {
212
+ "id": "PzdytlXFTNQ2"
213
+ },
214
+ "execution_count": null,
215
+ "outputs": []
216
+ },
217
+ {
218
+ "cell_type": "markdown",
219
+ "source": [
220
+ "Reconstruct with Vocos:"
221
+ ],
222
+ "metadata": {
223
+ "id": "BhUxBuP9TTTw"
224
+ }
225
+ },
226
+ {
227
+ "cell_type": "code",
228
+ "source": [
229
+ "audio_tokens_torch = torch.from_numpy(audio_tokens).to(device)\n",
230
+ "features = vocos.codes_to_features(audio_tokens_torch)\n",
231
+ "vocos_output = vocos.decode(features, bandwidth_id=torch.tensor([2], device=device)) # 6 kbps\n",
232
+ "# Upsample to 44100 Hz for better reproduction on audio hardware\n",
233
+ "vocos_output = torchaudio.functional.resample(vocos_output, orig_freq=24000, new_freq=44100).cpu()\n",
234
+ "Audio(vocos_output.numpy(), rate=44100)"
235
+ ],
236
+ "metadata": {
237
+ "id": "8hzSWQ5-nBlV"
238
+ },
239
+ "execution_count": null,
240
+ "outputs": []
241
+ },
242
+ {
243
+ "cell_type": "markdown",
244
+ "source": [
245
+ "Optionally save to mp3 files:"
246
+ ],
247
+ "metadata": {
248
+ "id": "RjVXQIZRb1Re"
249
+ }
250
+ },
251
+ {
252
+ "cell_type": "code",
253
+ "source": [
254
+ "torchaudio.save(\"encodec.mp3\", encodec_output[None, :], 44100, compression=128)\n",
255
+ "torchaudio.save(\"vocos.mp3\", vocos_output, 44100, compression=128)"
256
+ ],
257
+ "metadata": {
258
+ "id": "PLFXpjUKb3WX"
259
+ },
260
+ "execution_count": null,
261
+ "outputs": []
262
+ }
263
+ ]
264
+ }
vocos/requirements-train.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ pytorch_lightning==1.8.6
2
+ jsonargparse[signatures]
3
+ transformers
4
+ torchcrepe
5
+ pesq
6
+ matplotlib==3.7.0
7
+ # System dependency (not a pip requirement), install separately: conda install conda-forge::sox -y
8
+ git+https://github.com/One-sixth/fairseq.git
vocos/requirements.txt ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ torch
2
+ torchaudio
3
+ numpy
4
+ scipy
5
+ einops
6
+ pyyaml
7
+ huggingface_hub
8
+ encodec==0.1.1
vocos/setup.py ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import io
2
+ import os
3
+
4
+ from setuptools import find_packages, setup
5
+
6
# Pull __version__ out of the package without importing it. The file is opened
# in a `with` block so the handle is closed instead of leaking.
with open("vocos/__init__.py") as init_file:
    for line in init_file:
        line = line.strip()
        if "__version__" in line:
            # Executes the single assignment line from our own source tree.
            context = {}
            exec(line, context)
            VERSION = context["__version__"]
12
+
13
+
14
def read(*paths, **kwargs):
    """
    Return the stripped text content of a file located relative to this script.

    Args:
        *paths: path components joined onto this file's directory.
        **kwargs: ``encoding`` may be given; it defaults to ``"utf8"``.
    """
    file_path = os.path.join(os.path.dirname(__file__), *paths)
    with io.open(file_path, encoding=kwargs.get("encoding", "utf8")) as open_file:
        return open_file.read().strip()


def read_requirements(path):
    """
    Parse a requirements file into a list of requirement strings.

    Blank lines are dropped, and so are lines that (after stripping
    surrounding whitespace) start with ``"``, ``#``, ``-`` or ``git+``. The
    strip happens before the prefix test so indented comments and options are
    filtered as well.
    """
    skipped_prefixes = ('"', "#", "-", "git+")
    stripped_lines = (line.strip() for line in read(path).split("\n"))
    return [line for line in stripped_lines if line and not line.startswith(skipped_prefixes)]
25
+
26
+
27
# Package metadata collected in one mapping, then handed to setuptools.
package_metadata = {
    "name": "vocos",
    "version": VERSION,
    "author": "Hubert Siuzdak",
    "author_email": "[email protected]",
    "description": "Fourier-based neural vocoder for high-quality audio synthesis",
    "url": "https://github.com/charactr-platform/vocos",
    "long_description": read("README.md"),
    "long_description_content_type": "text/markdown",
    "packages": find_packages(),
    # Runtime dependencies; training extras are installed via `vocos[train]`.
    "install_requires": read_requirements("requirements.txt"),
    "extras_require": {"train": read_requirements("requirements-train.txt")},
}

setup(**package_metadata)
vocos/train.py ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ from pytorch_lightning.cli import LightningCLI
2
+
3
+
4
def _run_training():
    """Build trainer, model and datamodule from the CLI config, then fit."""
    # run=False: LightningCLI only instantiates the objects; fit is called explicitly.
    cli = LightningCLI(run=False)
    cli.trainer.fit(model=cli.model, datamodule=cli.datamodule)


if __name__ == "__main__":
    _run_training()
vocos/vocos/__init__.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ from vocos.pretrained import Vocos
2
+
3
+
4
+ __version__ = "0.1.0"
vocos/vocos/__pycache__/__init__.cpython-311.pyc ADDED
Binary file (234 Bytes). View file
 
vocos/vocos/__pycache__/dataset.cpython-311.pyc ADDED
Binary file (5.68 kB). View file
 
vocos/vocos/__pycache__/discriminators.cpython-311.pyc ADDED
Binary file (15.2 kB). View file