From ab3887c6ca34e4d01daac3badb7b7468aaa36e43 Mon Sep 17 00:00:00 2001
From: yemaozi88 <428968@gmail.com>
Date: Mon, 4 Feb 2019 20:32:12 +0100
Subject: [PATCH] sp is added to the model.

---
 .vs/acoustic_model/v15/.suo | Bin 97792 -> 97792 bytes
 acoustic_model/fame_hmm.py  | 120 ++++++++++++++++++++++++++++++------
 2 files changed, 100 insertions(+), 20 deletions(-)

diff --git a/.vs/acoustic_model/v15/.suo b/.vs/acoustic_model/v15/.suo
index 7775f45e621950b937c9b0523a5af065e8b353f2..ce9095444dca9c05b39c00500ddc4d81ab0ec4d8 100644
Binary files a/.vs/acoustic_model/v15/.suo and b/.vs/acoustic_model/v15/.suo differ
diff --git a/acoustic_model/fame_hmm.py b/acoustic_model/fame_hmm.py
index 881dec3..19d5f56 100644
--- a/acoustic_model/fame_hmm.py
+++ b/acoustic_model/fame_hmm.py
@@ -25,13 +25,17 @@ make_label = 0 # it takes roughly 4800 sec on Surface pro 2.
 make_htk_files = 0
 extract_features = 0
 flat_start = 0
-train_model_without_sp = 1
+train_model_without_sp = 0
+add_sp = 0
+train_model_with_sp = 0
+
 
 
 # pre-defined values.
 dataset_list = ['devel', 'test', 'train']
 
 hmmdefs_name = 'hmmdefs'
+proto_name = 'proto39'
 
 lexicon_asr = os.path.join(default.fame_dir, 'lexicon', 'lex.asr')
 lexicon_oov = os.path.join(default.fame_dir, 'lexicon', 'lex.oov')
@@ -41,7 +45,8 @@ config_hcopy = os.path.join(config_dir, 'config.HCopy')
 config_train = os.path.join(config_dir, 'config.train')
 global_ded = os.path.join(config_dir, 'global.ded')
 mkphones_led = os.path.join(config_dir, 'mkphones.led')
-prototype = os.path.join(config_dir, 'proto39')
+sil_hed = os.path.join(config_dir, 'sil.hed')
+prototype = os.path.join(config_dir, proto_name)
 
 model_dir = os.path.join(default.htk_dir, 'model')
 
@@ -55,6 +60,7 @@ lexicon_htk = os.path.join(lexicon_dir, 'lex.htk')
 phonelist_txt = os.path.join(config_dir, 'phonelist.txt')
 
 model0_dir = os.path.join(model_dir, 'hmm0')
+model1_dir = os.path.join(model_dir, 'hmm1')
 
 feature_dir = os.path.join(default.htk_dir, 'mfc')
 if not os.path.exists(feature_dir):
@@ -66,6 +72,13 @@ label_dir = os.path.join(default.htk_dir, 'label')
 if not os.path.exists(label_dir):
     os.makedirs(label_dir)
 
+## training
+hcompv_scp_train = os.path.join(tmp_dir, 'train.scp')
+mlf_file_train = os.path.join(label_dir, 'train_phone.mlf')
+
+## train without sp
+niter_max = 10
+
 
 ## ======================= make lexicon for HTK =======================
 if make_lexicon:
@@ -95,6 +108,7 @@ if make_lexicon:
 
 ## ======================= make label files =======================
 if make_label:
+    # train_2002_gongfansaken_10347.lab is empty. should be removed.
     for dataset in dataset_list:
         timer_start = time.time()
         print("==== making label files on dataset {}".format(dataset))
@@ -216,45 +230,111 @@ if extract_features:
 
 ## ======================= flat start monophones =======================
 if flat_start:
-    hcompv_scp = os.path.join(tmp_dir, 'test.scp')
-
     timer_start = time.time()
     print('==== flat start ====')
-    pyhtk.flat_start(config_train, hcompv_scp, model0_dir, prototype)
+    pyhtk.flat_start(config_train, hcompv_scp_train, model0_dir, prototype)
 
     # allocate mean & variance to all phones in the phone list
+    print('>>> allocating mean & variance to all phones in the phone list...')
     pyhtk.create_hmmdefs(
-        os.path.join(model0_dir, 'proto39'),
+        os.path.join(model0_dir, proto_name),
         os.path.join(model0_dir, 'hmmdefs'),
         phonelist_txt)
+
+    # make macros
+    print('>>> making macros...')
+    with open(os.path.join(model0_dir, 'vFloors')) as f:
+        lines = f.read()
+    with open(os.path.join(model0_dir, 'macros'), 'wb') as f:
+        f.write(bytes('~o 39\n' + lines, 'ascii'))
+    print("elapsed time: {}".format(time.time() - timer_start))
 
 
-## ======================= estimate monophones =======================
+## ======================= train model without short pause =======================
 if train_model_without_sp:
-    hcompv_scp = os.path.join(tmp_dir, 'test.scp')
-    mlf_file = os.path.join(label_dir, 'test_phone.mlf')
-    output_dir = os.path.join(model_dir, 'hmm1')
-    fh.make_new_directory(output_dir)
+    fh.make_new_directory(model1_dir)
 
     print('==== train model without sp ====')
-    if not os.path.exists(os.path.join(output_dir, 'iter0')):
-        shutil.copytree(model0_dir, os.path.join(output_dir, 'iter0'))
+    if not os.path.exists(os.path.join(model1_dir, 'iter0')):
+        shutil.copytree(model0_dir, os.path.join(model1_dir, 'iter0'))
 
-    niter = 1
-    for niter in range(1, 5):
+    for niter in range(1, niter_max):
         timer_start = time.time()
         hmm_n = 'iter' + str(niter)
         hmm_n_pre = 'iter' + str(niter-1)
-        modeln_dir = os.path.join(output_dir, hmm_n)
-        modeln_dir_pre = os.path.join(output_dir, hmm_n_pre)
+        modeln_dir = os.path.join(model1_dir, hmm_n)
+        modeln_dir_pre = os.path.join(model1_dir, hmm_n_pre)
 
         # re-estimation
         fh.make_new_directory(modeln_dir)
         pyhtk.re_estimation(
             config_train,
-            os.path.join(modeln_dir_pre, 'proto39'),
+            os.path.join(modeln_dir_pre, 'macros'),
             os.path.join(modeln_dir_pre, hmmdefs_name),
             modeln_dir,
-            hcompv_scp, phonelist_txt,
-            mlf_file=mlf_file)
+            hcompv_scp_train, phonelist_txt,
+            mlf_file=mlf_file_train)
         print("elapsed time: {}".format(time.time() - timer_start))
+
+
+## ======================= adding sp to the model =======================
+if add_sp:
+    print('==== adding sp to the model ====')
+
+    # make model with sp.
+    print('>>> modifying the last model in the previous step...')
+    modeln_dir_pre = os.path.join(model1_dir, 'iter'+str(niter_max-1))
+    modeln_dir = modeln_dir_pre.replace('iter' + str(niter_max-1), 'iter' + str(niter_max))
+    fh.make_new_directory(modeln_dir)
+    shutil.copy(
+        os.path.join(modeln_dir_pre, 'macros'),
+        os.path.join(modeln_dir, 'macros'))
+    shutil.copy(
+        os.path.join(modeln_dir_pre, hmmdefs_name),
+        os.path.join(modeln_dir, hmmdefs_name))
+
+    ## =======================
+    ## manually make changes to modeln_dir/hmmdefs
+    ## =======================
+    # add states 'sil'.
+    # http://www.f.waseda.jp/yusukekondo/htk.html#flat_start_estimation
+    #shutil.copy(
+    #    os.path.join(model_dir, 'hmmdefs.txt'),
+    #    os.path.join(modeln_dir, hmmdefs_name))
+
+    #hmmdefs_file_pre = os.path.join(modeln_dir_pre, hmmdefs_name)
+    hmmdefs_file = os.path.join(modeln_dir, hmmdefs_name)
+    macros_file = os.path.join(modeln_dir, 'macros')
+    #with open(hmmdefs_file_pre) as f:
+    #    lines = f.read()
+    #lines_ = lines.split('~h ')
+    #sil_model = [line for line in lines_ if line.split('\n')[0].replace('"', '') == 'sil'][0]
+
+    # update hmmdefs and macros.
+    print('>>> updating hmmdefs and macros...')
+    modeln_dir_pre = modeln_dir
+    modeln_dir = modeln_dir.replace('iter' + str(niter_max), 'iter' + str(niter_max+1))
+    fh.make_new_directory(modeln_dir)
+    pyhtk.include_sil_in_hmmdefs(macros_file, hmmdefs_file, modeln_dir, sil_hed, phonelist_txt)
+
+
+## ======================= train model with short pause =======================
+if train_model_with_sp:
+    print('==== train model with sp ====')
+    for niter in range(niter_max+1, niter_max*2+1):
+        timer_start = time.time()
+        hmm_n = 'iter' + str(niter)
+        hmm_n_pre = 'iter' + str(niter-1)
+        modeln_dir = os.path.join(model1_dir, hmm_n)
+        modeln_dir_pre = os.path.join(model1_dir, hmm_n_pre)
+
+        # re-estimation
+        fh.make_new_directory(modeln_dir)
+        pyhtk.re_estimation(
+            config_train,
+            os.path.join(modeln_dir_pre, 'macros'),
+            os.path.join(modeln_dir_pre, hmmdefs_name),
+            modeln_dir,
+            hcompv_scp_train, phonelist_txt,
+            mlf_file=mlf_file_train)
+        print("elapsed time: {}".format(time.time() - timer_start))
\ No newline at end of file
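
Note on the re-estimation loops above: pyhtk.re_estimation() is called with the training config, the macros file, the previous hmmdefs, an output directory, the training scp, the phone list and the phone-level MLF, but its implementation is not part of this patch. As a rough sketch of the kind of call it presumably wraps (the flags are the stock HTK HERest options, the pruning thresholds are the HTK tutorial values, and herest_pass is a hypothetical name, not pyhtk's actual code):

    import subprocess

    def herest_pass(config, macros, hmmdefs, out_dir, scp, phonelist, mlf):
        # One Baum-Welch re-estimation pass with HTK's HERest; the updated
        # macros/hmmdefs are written into out_dir.
        subprocess.run(
            ['HERest',
             '-C', config,                       # training configuration
             '-I', mlf,                          # phone-level label MLF
             '-t', '250.0', '150.0', '1000.0',   # pruning thresholds (HTK tutorial values)
             '-S', scp,                          # list of training feature files
             '-H', macros,                       # global options + variance floors
             '-H', hmmdefs,                      # current model set
             '-M', out_dir,                      # output directory
             phonelist],                         # monophone list
            check=True)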
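Note on the add_sp block: the commented-out lines that split hmmdefs on '~h ' and pick out 'sil' hint at what "adding sp" means in the usual HTK recipe: 'sp' is a three-state "tee" model whose single emitting state is a copy of the centre state of 'sil'. pyhtk.include_sil_in_hmmdefs() is not shown in this patch, so the following is only a sketch of that step under those assumptions; the transition values are placeholders (the skip transition is normally added later by HHEd):

    def add_sp_model(hmmdefs_in, hmmdefs_out):
        # Sketch: copy the centre (3rd) state of 'sil' into a new 'sp' model with
        # one emitting state, and append it to the model set.
        with open(hmmdefs_in) as f:
            text = f.read()
        models = text.split('~h ')
        sil = [m for m in models if m.split('\n')[0].replace('"', '') == 'sil'][0]
        # body of sil's state 3, i.e. everything between '<STATE> 3' and '<STATE> 4'
        state3 = sil.split('<STATE> 3')[1].split('<STATE> 4')[0]
        sp = ('~h "sp"\n<BEGINHMM>\n<NUMSTATES> 3\n'
              '<STATE> 2' + state3 +
              '<TRANSP> 3\n'
              ' 0.0 1.0 0.0\n'   # placeholder transitions; HHEd's AT command adds the 1->3 skip
              ' 0.0 0.9 0.1\n'
              ' 0.0 0.0 0.0\n'
              '<ENDHMM>\n')
        with open(hmmdefs_out, 'w') as f:
            f.write(text + sp)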
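Note on sil_hed: it points to config/sil.hed, which is referenced but not included in this diff. In the HTK Book's tutorial, the corresponding HHEd edit script adds skip/backward transitions inside 'sil' and ties sp's emitting state to sil's centre state with commands like the ones below; whether this repository's sil.hed is identical is an assumption, and write_sil_hed is a hypothetical helper for illustration:

    SIL_HED = (
        'AT 2 4 0.2 {sil.transP}\n'              # skip transition inside sil
        'AT 4 2 0.2 {sil.transP}\n'              # backward transition inside sil
        'AT 1 3 0.3 {sp.transP}\n'               # skip that makes sp a tee model
        'TI silst {sil.state[3],sp.state[2]}\n'  # tie sp's state to sil's centre state
    )

    def write_sil_hed(path):
        # Write the HHEd script that is expected to be run together with the phone list
        # when sp is folded into the model set.
        with open(path, 'w') as f:
            f.write(SIL_HED)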