We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7ae9d17 · commit 9e51888 · Copy full SHA for 9e51888
Preprocessing/TextFrontend.py
@@ -355,6 +355,7 @@ def postprocess_phoneme_string(self, phoneme_string, for_feature_extraction, inc
355
("ɬ", "s"), # lateral
356
("ɮ", "z"), # lateral
357
('ɺ', 'ɾ'), # lateral
358
+ ('ʲ', 'j'), # decomposed palatalization
359
('\u02CC', ""), # secondary stress
360
('\u030B', "˥"),
361
('\u0301', "˦"),
@@ -380,7 +381,7 @@ def postprocess_phoneme_string(self, phoneme_string, for_feature_extraction, inc
380
381
]
382
unsupported_ipa_characters = {'̹', '̙', '̞', '̯', '̤', '̪', '̩', '̠', '̟', 'ꜜ',
383
'̬', '̽', 'ʰ', '|', '̝', '•', 'ˠ', '↘',
- '‖', '̰', '‿', 'ᷝ', '̈', 'ᷠ', '̜', 'ʷ', 'ʲ',
384
+ '‖', '̰', '‿', 'ᷝ', '̈', 'ᷠ', '̜', 'ʷ',
385
'̚', '↗', 'ꜛ', '̻', '̥', 'ˁ', '̘', '͡', '̺'}
386
# TODO support more of these. Problem: bridge over to aligner ID lookups after modifying the feature vector
387
# https://en.wikipedia.org/wiki/IPA_number
0 commit comments