ai-pronunciation-trainer / RuleBasedModels.py
alessandro trinca tornidor
feat: port whisper and faster-whisper support from https://github.com/Thiagohgl/ai-pronunciation-trainer
85b7206
raw
history blame
1.18 kB
import ModelInterfaces
import torch
import numpy as np
import epitran
import eng_to_ipa
def get_phonem_converter(language: str):
if language == 'de':
phonem_converter = EpitranPhonemConverter(
epitran.Epitran('deu-Latn'))
elif language == 'en':
phonem_converter = EngPhonemConverter()
else:
raise ValueError('Language not implemented')
return phonem_converter
class EpitranPhonemConverter(ModelInterfaces.ITextToPhonemModel):
word_locations_in_samples = None
audio_transcript = None
def __init__(self, epitran_model) -> None:
super().__init__()
self.epitran_model = epitran_model
def convertToPhonem(self, sentence: str) -> str:
phonem_representation = self.epitran_model.transliterate(sentence)
return phonem_representation
class EngPhonemConverter(ModelInterfaces.ITextToPhonemModel):
def __init__(self,) -> None:
super().__init__()
def convertToPhonem(self, sentence: str) -> str:
phonem_representation = eng_to_ipa.convert(sentence)
phonem_representation = phonem_representation.replace('*','')
return phonem_representation