Spaces:

sarinam
/

speaker-anonymization-gan

Running

Initial commit

dcd7182 about 2 years ago

772 Bytes

	from IMSToucan.InferenceInterfaces.AnonFastSpeech2 import AnonFastSpeech2


	class DemoTTS:

	def __init__(self, model_paths, device):
	self.device = device
	fastspeech_path = model_paths / 'FastSpeech2_Multi' / 'trained_on_ground_truth_phonemes.pt'
	hifigan_path = model_paths / 'HiFiGAN_combined' / 'best.pt'
	self.model = AnonFastSpeech2(device=self.device, path_to_hifigan_model=hifigan_path,
	path_to_fastspeech_model=fastspeech_path)

	def read_text(self, transcription, speaker_embedding, text_is_phonemes=False):
	self.model.default_utterance_embedding = speaker_embedding.to(self.device)
	wav = self.model(text=transcription, text_is_phonemes=text_is_phonemes)
	return wav