Spaces: Running on Zero
Upload folder using huggingface_hub
Browse files
soulxpodcast/utils/dataloader.py
CHANGED
|
@@ -123,7 +123,7 @@ class PodcastDataset(Dataset):
|
|
| 123 |
prompt_text_ids = self.text_tokenizer.encode(prompt_text)
|
| 124 |
prompt_text_ids_list.append(prompt_text_ids)
|
| 125 |
if use_dialect_prompt:
|
| 126 |
-
import pdb; pdb.set_trace()
|
| 127 |
dialect_prompt_text = normalize_text(data["dialect_prompt_text"][spk_idx])
|
| 128 |
dialect_prompt_text = f"{SPK_DICT[spk_idx]}{TEXT_START}{dialect_prompt_text}{TEXT_END}{AUDIO_START}"
|
| 129 |
dialect_prompt_text_ids = self.text_tokenizer.encode(dialect_prompt_text)
|
|
|
|
| 123 |
prompt_text_ids = self.text_tokenizer.encode(prompt_text)
|
| 124 |
prompt_text_ids_list.append(prompt_text_ids)
|
| 125 |
if use_dialect_prompt:
|
| 126 |
+
# import pdb; pdb.set_trace()
|
| 127 |
dialect_prompt_text = normalize_text(data["dialect_prompt_text"][spk_idx])
|
| 128 |
dialect_prompt_text = f"{SPK_DICT[spk_idx]}{TEXT_START}{dialect_prompt_text}{TEXT_END}{AUDIO_START}"
|
| 129 |
dialect_prompt_text_ids = self.text_tokenizer.encode(dialect_prompt_text)
|