(self, batch_size, r, bgs, start_by_longest=False)
| 45 | self.ap = AudioProcessor(**c.audio) |
| 46 | |
def _create_dataloader(self, batch_size, r, bgs, start_by_longest=False):
    """Build a ``TTSDataset`` and a ``DataLoader`` that iterates over it.

    The train and eval splits returned by ``load_tts_samples`` are
    concatenated, so the dataset is built from both of them.

    Args:
        batch_size: Forwarded to ``DataLoader`` as ``batch_size``.
        r: Forwarded to ``TTSDataset`` as ``outputs_per_step``.
        bgs: Forwarded to ``TTSDataset`` as ``batch_group_size``.
        start_by_longest: Forwarded unchanged to ``TTSDataset``.

    Returns:
        A ``(dataloader, dataset)`` tuple.
    """
    # Load both splits, then merge them back into a single sample list.
    train_samples, eval_samples = load_tts_samples(
        dataset_config, eval_split=True, eval_split_size=0.2
    )
    all_samples = train_samples + eval_samples

    tokenizer, _ = TTSTokenizer.init_from_config(c)

    # Dataset options; length limits come from the module-level config ``c``.
    dataset_options = {
        "outputs_per_step": r,
        "compute_linear_spec": True,
        "return_wav": True,
        "tokenizer": tokenizer,
        "ap": self.ap,
        "samples": all_samples,
        "batch_group_size": bgs,
        "min_text_len": c.min_text_len,
        "max_text_len": c.max_text_len,
        "min_audio_len": c.min_audio_len,
        "max_audio_len": c.max_audio_len,
        "start_by_longest": start_by_longest,
    }
    tts_dataset = TTSDataset(**dataset_options)

    # No shuffling, and the trailing incomplete batch is dropped.
    loader_options = {
        "batch_size": batch_size,
        "shuffle": False,
        "collate_fn": tts_dataset.collate_fn,
        "drop_last": True,
        "num_workers": c.num_loader_workers,
    }
    loader = DataLoader(tts_dataset, **loader_options)

    return loader, tts_dataset
| 76 | |
| 77 | def test_loader(self): |
| 78 | if ok_ljspeech: |
no test coverage detected