"""Definition of the phones to be used."""

## phones in IPA.
# Entries that are commented out are kept on purpose, together with the
# original note on why each one is excluded.
phoneset_ipa = [
    # vowels
    'i̯',
    'i̯ⁿ',
    'y',
    'i',
    'i.',
    'iⁿ',
    'i:',
    'i:ⁿ',
    'ɪ',
    'ɪⁿ',
    'ɪ.',
    #'ɪ:', # not included in lex.ipa
    'ɪ:ⁿ',
    'e',
    'e:',
    'e:ⁿ',
    'ə',
    'əⁿ',
    'ə:',
    'ɛ',
    'ɛ.',
    'ɛⁿ',
    'ɛ:',
    'ɛ:ⁿ',
    'a',
    'aⁿ',
    'a.',
    'a:',
    'a:ⁿ',
    'ṷ',
    'ṷ.',
    'ṷⁿ',
    #'ú', # only appears in word 'feeste'(út) and 'gaste'(út) which are 'f e: s t ə' and 'yn' in lex_asr.
    'u',
    'uⁿ',
    'u.',
    'u:',
    'u:ⁿ',
    'ü',
    'ü.',
    'üⁿ',
    'ü:',
    'ü:ⁿ',
    'o',
    'oⁿ',
    'o.',
    'o:',
    'o:ⁿ',
    'ö',
    'ö.',
    'öⁿ',
    'ö:',
    'ö:ⁿ',
    'ɔ',
    'ɔ.',
    'ɔⁿ',
    'ɔ:',
    'ɔ:ⁿ',
    #'ɔ̈', # not included in lex.ipa
    'ɔ̈.',
    'ɔ̈:',

    # plosives
    'p',
    'b',
    't',
    'tⁿ',
    'd',
    'k',
    'g',
    'ɡ', # = 'g'

    # nasals
    'm',
    'n',
    'ŋ',

    # fricatives
    'f',
    'v',
    's',
    's:',
    'z',
    'zⁿ',
    'x',
    'h',

    # tap and flip
    'r',
    'r.', # only appears in word 'mearpartijestelsel'(does not exist in lex_asr) and 'tenoarpartij'.
    'r:', # only appears in word 'mûsearflearmûs' and 'sjochdêr'.

    # approximant
    'j',
    'j.',
    'l',
]

## the list of multi character phones.
# A phone can be written with more than one character: for example, the
# length of 'i̯ⁿ' is 3, but in the code it is treated as one letter.
# The list is ordered from the longest phone to the shortest; the sort is
# stable, so phones of equal length keep their order from phoneset_ipa.
# NOTE(review): longest-first presumably lets longer phones be matched before
# the shorter phones they start with -- confirm against the callers.
multi_character_phones_ipa = sorted(
    (phone for phone in phoneset_ipa if len(phone) > 1),
    key=len,
    reverse=True,
)