Add new phoneme mode
Browse files
app.py
CHANGED
@@ -25,7 +25,7 @@ transformation = jiwer.Compose([
|
|
25 |
from transformers import Wav2Vec2Processor, Wav2Vec2ForCTC
|
26 |
processor = Wav2Vec2Processor.from_pretrained("vitouphy/wav2vec2-xls-r-300m-timit-phoneme")
|
27 |
model = Wav2Vec2ForCTC.from_pretrained("vitouphy/wav2vec2-xls-r-300m-timit-phoneme")
|
28 |
-
|
29 |
class ChangeSampleRate(nn.Module):
|
30 |
def __init__(self, input_rate: int, output_rate: int):
|
31 |
super().__init__()
|
|
|
25 |
from transformers import Wav2Vec2Processor, Wav2Vec2ForCTC
|
26 |
processor = Wav2Vec2Processor.from_pretrained("vitouphy/wav2vec2-xls-r-300m-timit-phoneme")
|
27 |
model = Wav2Vec2ForCTC.from_pretrained("vitouphy/wav2vec2-xls-r-300m-timit-phoneme")
|
28 |
+
phoneme_model = pipeline(model="vitouphy/wav2vec2-xls-r-300m-timit-phoneme")
|
29 |
class ChangeSampleRate(nn.Module):
|
30 |
def __init__(self, input_rate: int, output_rate: int):
|
31 |
super().__init__()
|