acoustic_model/acoustic_model/phoneset/fame_asr.py

""" definition of the phones to be used. """

# phones in {FAME}/lexicon/lex.asr
phoneset = [
	# vowels
	'a', 'a:',
	'e', 'e:',
	'i', 'i:', 'i̯',
	'o', 'o:',
	'ö', 'ö:',
	'u', 'u:',
	'ü', 'ü:',
	# 'ú' is left out on purpose: it only appears in the words 'feeste'(út)
	# and 'gaste'(út), which are 'f e: s t ə' and 'yn' in lex_asr. The
	# pronunciation in Fries may be a mistake, so the phone was removed.
	'ṷ',
	'y',
	'ɔ', 'ɔ:',
	'ɔ̈', 'ɔ̈:',
	'ə',
	'ɛ', 'ɛ:',
	'ɪ', 'ɪ:',

	# plosives
	'p', 'b',
	't', 'd',
	'k', 'g',
	'ɡ',  # = 'g'

	# nasals
	'm', 'n', 'ŋ',

	# fricatives
	'f', 'v',
	's', 's:', 'z',
	'x', 'h',

	# tap and flap
	'r', 'r:',

	# approximants
	'j', 'l',
]


## reduce the number of phones.
# phones which seldom occur are replaced with more frequent ones.
# the replacements are based on advice from Martijn Wieling.
reduction_key = {
	'y':'i:', 'e':'e:', 'ə:':'ɛ:', 'r:':'r', 'ɡ':'g',
	# aki added because this is used in stimmen_project.
	'ɔ̈:':'ɔ:'
	}
# phones which phone_reduction() drops entirely.
# 'ú' is already commented out of phoneset; 's:' is still listed there.
phones_to_be_removed = ['ú', 's:']

def phone_reduction(phones):
	"""Map a sequence of phones onto the reduced phone set.

	Phones listed in `phones_to_be_removed` are dropped (a notice is printed
	when at least one of them is present). Every remaining phone is replaced
	by its entry in `reduction_key`, or kept unchanged when it has none.

	Args:
		phones (iterable of str): phones to reduce, e.g. a list.

	Returns:
		list: the reduced phones, in their original order.
	"""
	# materialise the input once: it is scanned twice below, and a one-shot
	# iterator would otherwise be exhausted by the first scan.
	phones = list(phones)
	if any(phone in phones_to_be_removed for phone in phones):
		print('input includes phone(s) which is not defined in fame_asr.')
		print('those phone(s) are removed.')
	return [reduction_key.get(phone, phone) for phone in phones
			if phone not in phones_to_be_removed]

# unique phones that remain after the reduction, in sorted order.
phoneset_short = sorted(set(phone_reduction(phoneset)))


## translation_key to htk format (ascii).
# phones which give UnicodeEncodeError on phone.encode("ascii")
# are replaced with other characters.
translation_key_asr2htk = {
	'i̯': 'i_',
	'ṷ': 'u_',

	# on the analogy of German umlaut, 'e' is used.
	'ö': 'oe', 'ö:': 'oe:',
	'ü': 'ue', 'ü:': 'ue:',

	# on the analogy of Chinese...
	'ŋ': 'ng',

	# refer to Xsampa.
	'ɔ': 'O', 'ɔ:': 'O:', 'ɔ̈': 'Oe',
	#'ɔ̈:': 'O:', # does not appear in FAME, but used in stimmen.
	'ɛ': 'E', 'ɛ:': 'E:',
	'ɪ': 'I', 'ɪ:': 'I:',

	# it is @ in Xsampa, but that is not handy on HTK.
	'ə': 'A'
	}
# htk (ascii) spelling of each reduced phone; phones without an entry in the
# translation key are kept as they are.
phoneset_htk = [
	translation_key_asr2htk.get(phone, phone)
	for phone in phoneset_short
]

#not_in_ascii = [
#	'\'', 
#	'â', 'ê', 'ô', 'û', 'č', 
#	'à', 'í', 'é', 'è', 'ú', 'ć', 
#	'ä', 'ë', 'ï', 'ö', 'ü'
#]
# ascii replacements for the accented letters which occur in words.
translation_key_word2htk = {
	#'\'': '\\\'',
	# acute accent -> 1
	'í': 'i1',
	'é': 'e1',
	'ú': 'u1',
	'ć': 'c1',
	# grave accent -> 2
	'à': 'a2',
	'è': 'e2',
	# circumflex -> 3
	'â': 'a3',
	'ê': 'e3',
	'ô': 'o3',
	'û': 'u3',
	# caron -> 4
	'č': 'c4',
	# diaeresis -> two letters
	'ä': 'ao',
	'ë': 'ee',
	'ï': 'ie',
	'ö': 'oe',
	'ü': 'ue',
}
#[translation_key_word2htk.get(i, i) for i in not_in_ascii]
#Stop: p, b, t, d, k, g  
#Nasal: m, n, ng(ŋ)
#Fricative: s, z, f, v, h, x
#Liquid: l, r
#Vowel: a, a:, e:, i, i:, i_(i̯), o, o:, u, u:, u_(ṷ), oe(ö), oe:(ö:), ue(ü), ue:(ü:), O(ɔ), O:(ɔ:), Oe(ɔ̈), A(ə), E(ɛ), E:(ɛ:), I(ɪ), I:(ɪ:)


## the lists of multi character phones.
# for example, 'a:' is more than one character long, but in the code it is
# treated as one letter. every list is ordered longest phone first.

# original.
multi_character_phones = sorted(
	(phone for phone in phoneset if len(phone) > 1),
	key=len, reverse=True)

# phoneset reduced.
multi_character_phones_short = sorted(
	(phone for phone in phoneset_short if len(phone) > 1),
	key=len, reverse=True)

# htk compatible.
multi_character_phones_htk = sorted(
	(phone for phone in phoneset_htk if len(phone) > 1),
	key=len, reverse=True)
-												correspondence between lex.asr and lex.ipa is automatically obtained. header is added to the functions in fame_functions.py.

											
										
										
											2019-01-27 23:52:33 +01:00
+								""" definition of the phones to be used. """
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+								# phonese in {FAME}/lexicon/lex.asr
-												fame_asr phoneset is added including reduced version and htk compatible version.

											
										
										
											2019-01-28 12:34:20 +01:00
+								phoneset = [
-												phonset is given as fame_phoneset.py. translation key is obtained based on the information.

											
										
										
											2019-01-27 01:34:04 +01:00
+									# vowels
 									'a',
 									'a:',
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+									'e',
 									'e:',
 									'i',
 									'i:',
 									'i̯',
-												phonset is given as fame_phoneset.py. translation key is obtained based on the information.

											
										
										
											2019-01-27 01:34:04 +01:00
+									'o',
 									'o:',
 									'ö',
 									'ö:',
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+									'u',
 									'u:',
 									'ü',
 									'ü:',
 									#'ú', # only appears in word 'feeste'(út) and 'gaste'(út) which are 'f e: s t ə' and 'yn' in lex_asr. The pronunciation in Fries may be mistakes so I removed this phone.
 									'ṷ',
 									'y',
-												phonset is given as fame_phoneset.py. translation key is obtained based on the information.

											
										
										
											2019-01-27 01:34:04 +01:00
+									'ɔ',
 									'ɔ:',
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+									'ɔ̈',
-												phonset is given as fame_phoneset.py. translation key is obtained based on the information.

											
										
										
											2019-01-27 01:34:04 +01:00
+									'ɔ̈:',
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+									'ə',
 									'ɛ',
 									'ɛ:',
 									'ɪ',
 									'ɪ:',
-												phonset is given as fame_phoneset.py. translation key is obtained based on the information.

											
										
										
											2019-01-27 01:34:04 +01:00
 									# plosives
 									'p',
 									'b',
-												correspondence between lex.asr and lex.ipa is automatically obtained. header is added to the functions in fame_functions.py.

											
										
										
											2019-01-27 23:52:33 +01:00
+									't',
-												phonset is given as fame_phoneset.py. translation key is obtained based on the information.

											
										
										
											2019-01-27 01:34:04 +01:00
+									'd',
 									'k',
 									'g',
-												correspondence between lex.asr and lex.ipa is automatically obtained. header is added to the functions in fame_functions.py.

											
										
										
											2019-01-27 23:52:33 +01:00
+									'ɡ', # = 'g'
-												phonset is given as fame_phoneset.py. translation key is obtained based on the information.

											
										
										
											2019-01-27 01:34:04 +01:00
 									# nasals
 									'm',
 									'n',
 									'ŋ',
 									# fricatives
 									'f',
 									'v',
 									's',
 									's:',
 									'z',
 									'x',
 									'h',
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
-												correspondence between lex.asr and lex.ipa is automatically obtained. header is added to the functions in fame_functions.py.

											
										
										
											2019-01-27 23:52:33 +01:00
+									# tap and flip
 									'r',
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+									'r:',
-												correspondence between lex.asr and lex.ipa is automatically obtained. header is added to the functions in fame_functions.py.

											
										
										
											2019-01-27 23:52:33 +01:00
 									# approximant
 									'j',
 									'l'
-												phonset is given as fame_phoneset.py. translation key is obtained based on the information.

											
										
										
											2019-01-27 01:34:04 +01:00
+									]
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
 								## reduce the number of phones.
 								# the phones which seldom occur are replaced with another more popular phones.
 								# replacements are based on the advice from Martijn Wieling.
 								reduction_key = {
-												label alignment using HVite is added.

											
										
										
											2019-02-14 00:21:28 +01:00
+									'y':'i:', 'e':'e:', 'ə:':'ɛ:', 'r:':'r', 'ɡ':'g',
 									# aki added because this is used in stimmen_project.
 									'ɔ̈:':'ɔ:'
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+									}
 								# already removed beforehand in phoneset. Just to be sure.
-												label alignment using HVite is added.

											
										
										
											2019-02-14 00:21:28 +01:00
+								phones_to_be_removed = ['ú', 's:']
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
-												make sure all the phones in stimmen transcription can be treated correctly.

											
										
										
											2019-02-06 00:00:14 +01:00
+								def phone_reduction(phones):
-												label alignment using HVite is added.

											
										
										
											2019-02-14 00:21:28 +01:00
+									"""
 									Args:
 										phones (list): list of phones.
 									"""
-												fame_phonetics.py and functions to make quests.hed to tie triphone are added.

											
										
										
											2019-03-25 00:06:53 +01:00
+									if sum([phone in phones for phone in phones_to_be_removed]) != 0:
 										print('input includes phone(s) which is not defined in fame_asr.')
 										print('those phone(s) are removed.')
-												make sure all the phones in stimmen transcription can be treated correctly.

											
										
										
											2019-02-06 00:00:14 +01:00
+									return [reduction_key.get(i, i) for i in phones
-												fame_phonetics.py and functions to make quests.hed to tie triphone are added.

											
										
										
											2019-03-25 00:06:53 +01:00
+										 if i not in phones_to_be_removed]
-												label alignment using HVite is added.

											
										
										
											2019-02-14 00:21:28 +01:00
-												make sure all the phones in stimmen transcription can be treated correctly.

											
										
										
											2019-02-06 00:00:14 +01:00
+								phoneset_short = list(set(phone_reduction(phoneset)))
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+								phoneset_short.sort()
-												make sure all the phones in stimmen transcription can be treated correctly.

											
										
										
											2019-02-06 00:00:14 +01:00
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+								## translation_key to htk format (ascii).
 								# phones which gives UnicodeEncodeError when phone.encode("ascii")
 								# are replaced with other characters.
 								translation_key_asr2htk = {
 									'i̯': 'i_',
 									'ṷ': 'u_',
 									# on the analogy of German umlaut, 'e' is used.
-												fame_phonetics.py and functions to make quests.hed to tie triphone are added.

											
										
										
											2019-03-25 00:06:53 +01:00
+									'ö': 'oe', 'ö:': 'oe:', ''
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+									'ü': 'ue', 'ü:': 'ue:',
 									# on the analogy of Chinese...
 									'ŋ': 'ng',
 									# refer to Xsampa.
-												label alignment using HVite is added.

											
										
										
											2019-02-14 00:21:28 +01:00
+									'ɔ': 'O', 'ɔ:': 'O:', 'ɔ̈': 'Oe',
 									#'ɔ̈:': 'O:', # does not appear in FAME, but used in stimmen.
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+									'ɛ': 'E', 'ɛ:': 'E:',
 									'ɪ': 'I', 'ɪ:': 'I:',
 									# it is @ in Xsampa, but that is not handy on HTK.
 									'ə': 'A'
 									}
 								phoneset_htk = [translation_key_asr2htk.get(i, i) for i in phoneset_short]
-												fix the bug there are characters in the lexicon which cannot be described in ascii.

											
										
										
											2019-02-03 00:34:35 +01:00
+								#not_in_ascii = [
 								#	'\'',
 								#	'â', 'ê', 'ô', 'û', 'č',
 								#	'à', 'í', 'é', 'è', 'ú', 'ć',
 								#	'ä', 'ë', 'ï', 'ö', 'ü'
 								#]
 								translation_key_word2htk = {
-												label files are extracted. hcompv_scp is made.

											
										
										
											2019-02-03 13:54:37 +01:00
+									#'\'': '\\\'',
-												fix the bug there are characters in the lexicon which cannot be described in ascii.

											
										
										
											2019-02-03 00:34:35 +01:00
+									'í':'i1', 'é':'e1', 'ú':'u1', 'ć':'c1',
 									'à':'a2', 'è':'e2',
 									'â':'a3', 'ê':'e3', 'ô':'o3', 'û':'u3',
 									'č':'c4',
 									'ä': 'ao', 'ë': 'ee', 'ï': 'ie', 'ö': 'oe', 'ü': 'ue',
 								}
 								#[translation_key_word2htk.get(i, i) for i in not_in_ascii]
-												test on stimmen data is added.

											
										
										
											2019-03-03 02:05:37 +01:00
+								#Stop: p, b, t, d, k, g
 								#Nasal: m, n, ng(ŋ)
 								#Fricative: s, z, f, v, h, x
 								#Liquid: l, r
 								#Vowel: a, a:, e:, i, i:, i_(i̯), o, o:, u, u:, u_(ṷ), oe(ö), oe:(ö:), ue(ü), ue:(ü:), O(ɔ), O:(ɔ:), Oe(ɔ̈), A(ə), E(ɛ), E:(ɛ:), I(ɪ), I:(ɪ:)
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
-												correspondence between lex.asr and lex.ipa is automatically obtained. header is added to the functions in fame_functions.py.

											
										
										
											2019-01-27 23:52:33 +01:00
+								## the list of multi character phones.
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+								# for example, the length of 'a:' is 3, but in the codes it is treated as one letter.
 								# original.
-												fame_asr phoneset is added including reduced version and htk compatible version.

											
										
										
											2019-01-28 12:34:20 +01:00
+								multi_character_phones = [i for i in phoneset if len(i) > 1]
-												lexicon is made.

											
										
										
											2019-01-29 21:52:11 +01:00
+								multi_character_phones.sort(key=len, reverse=True)
 								# phonset reduced.
 								multi_character_phones_short = [i for i in phoneset_short if len(i) > 1]
 								multi_character_phones_short.sort(key=len, reverse=True)
 								# htk compatible.
 								multi_character_phones_htk = [i for i in phoneset_htk if len(i) > 1]
 								multi_character_phones_htk.sort(key=len, reverse=True)