Compare commits

...

2 commits

Author SHA1 Message Date
2d908e60a5 Add logging to tts gen 2025-03-09 15:55:25 -07:00
d53508c158 Fix audio stretching behavior attempt 2 2025-03-09 15:55:06 -07:00
2 changed files with 3 additions and 1 deletion

View file

@@ -53,7 +53,7 @@ class Clip:
def stretch(self, speed, keep_pitch=True):
if keep_pitch:
- stretched = tsm.wsola(self._stereo_transpose(self.raw), speed)
+ stretched = tsm.wsola(self._stereo_transpose(self.raw), 1 / speed)
else:
stretched = librosa.resample(self._stereo_transpose(self.raw), self.samplerate * speed, self.samplerate, fix=False, scale=True)
self.raw = np.ascontiguousarray(self._stereo_transpose(stretched), dtype='float32')

View file

@@ -74,12 +74,14 @@ class TextToSpeechPlugin(PluginBase):
if filename is None:
filename = os.path.join(self.cache_dir, f'{uuid.uuid1()}.wav')
+ self.logger.info(f'Generating TTS "{text}"...')
if self.speaker_wav:
wav = self.synthesizer.tts(text, None, 'en', self.speaker_wav)
else:
wav = self.synthesizer.tts(text)
self.synthesizer.save_wav(wav, filename)
+ self.logger.info(f'Done - saved as {filename}')
return filename
async def run(self, text, *args, _ctx={}, wait=False, **kwargs):