<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/css" href="http://cslt.org/mediawiki/skins/common/feed.css?303"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="zh-cn">
		<id>http://cslt.org/mediawiki/index.php?action=history&amp;feed=atom&amp;title=2014-07-18</id>
		<title>2014-07-18 - 版本历史</title>
		<link rel="self" type="application/atom+xml" href="http://cslt.org/mediawiki/index.php?action=history&amp;feed=atom&amp;title=2014-07-18"/>
		<link rel="alternate" type="text/html" href="http://cslt.org/mediawiki/index.php?title=2014-07-18&amp;action=history"/>
		<updated>2026-04-17T06:52:41Z</updated>
		<subtitle>本wiki的该页面的版本历史</subtitle>
		<generator>MediaWiki 1.23.3</generator>

	<entry>
		<id>http://cslt.org/mediawiki/index.php?title=2014-07-18&amp;diff=10471&amp;oldid=prev</id>
		<title>Zhaomy：/* Multilingual ASR */</title>
		<link rel="alternate" type="text/html" href="http://cslt.org/mediawiki/index.php?title=2014-07-18&amp;diff=10471&amp;oldid=prev"/>
				<updated>2014-07-18T02:34:30Z</updated>
		
		<summary type="html">&lt;p&gt;‎&lt;span dir=&quot;auto&quot;&gt;&lt;span class=&quot;autocomment&quot;&gt;Multilingual ASR&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;table class='diff diff-contentalign-left'&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;tr style='vertical-align: top;'&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;←上一版本&lt;/td&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;2014年7月18日 (五) 02:34的版本&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;第26行：&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;第26行：&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;#160; Tel201406.v1.0.S&amp;#160; |&amp;#160; &amp;#160; &amp;#160; &amp;#160;  |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;#160; Tel201406.v1.0.S&amp;#160; |&amp;#160; &amp;#160; &amp;#160; &amp;#160;  |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;#160; Tel201406.v1.1.S&amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;#160; Tel201406.v1.1.S&amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&amp;#160; &amp;#160; -&amp;#160; &amp;#160; |&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;−&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;Tel201406.HW.v2.0.B|&amp;#160; 20.18&amp;#160; |&amp;#160; 17.49&amp;#160; |&amp;#160; 23.85&amp;#160; |&amp;#160; 22.81&amp;#160; |&amp;#160; 22.48&amp;#160; |&amp;#160; &lt;del class=&quot;diffchange diffchange-inline&quot;&gt;55&lt;/del&gt;.&lt;del class=&quot;diffchange diffchange-inline&quot;&gt;06 &lt;/del&gt; |&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;Tel201406.HW.v2.0.B|&amp;#160; 20.18&amp;#160; |&amp;#160; 17.49&amp;#160; |&amp;#160; 23.85&amp;#160; |&amp;#160; 22.81&amp;#160; |&amp;#160; 22.48&amp;#160; |&amp;#160; &lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;83&lt;/ins&gt;.&lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;28 &lt;/ins&gt; |&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;−&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;Tel201406.HW.v2.0.S|&amp;#160; 19.95&amp;#160; |&amp;#160; 17.74&amp;#160; |&amp;#160; 23.73&amp;#160; |&amp;#160; 22.36&amp;#160; |&amp;#160; 22.49&amp;#160; |&amp;#160; &lt;del class=&quot;diffchange diffchange-inline&quot;&gt;37&lt;/del&gt;.&lt;del class=&quot;diffchange diffchange-inline&quot;&gt;63 &lt;/del&gt; |&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;Tel201406.HW.v2.0.S|&amp;#160; 19.95&amp;#160; |&amp;#160; 17.74&amp;#160; |&amp;#160; 23.73&amp;#160; |&amp;#160; 22.36&amp;#160; |&amp;#160; 22.49&amp;#160; |&amp;#160; &lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;67&lt;/ins&gt;.&lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;70 &lt;/ins&gt; |&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;−&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;Tel201406.HW.v2.1.B|&amp;#160; 19.14&amp;#160; |&amp;#160; 16.97&amp;#160; |&amp;#160; 24.26&amp;#160; |&amp;#160; 22.28&amp;#160; |&amp;#160; 22.97&amp;#160; |&amp;#160; &lt;del class=&quot;diffchange diffchange-inline&quot;&gt;55&lt;/del&gt;.&lt;del class=&quot;diffchange diffchange-inline&quot;&gt;35 &lt;/del&gt; |&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;Tel201406.HW.v2.1.B|&amp;#160; 19.14&amp;#160; |&amp;#160; 16.97&amp;#160; |&amp;#160; 24.26&amp;#160; |&amp;#160; 22.28&amp;#160; |&amp;#160; 22.97&amp;#160; |&amp;#160; &lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;85&lt;/ins&gt;.&lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;41 &lt;/ins&gt; |&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;−&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;Tel201406.HW.v2.1.S|&amp;#160; 19.44&amp;#160; |&amp;#160; 17.62&amp;#160; |&amp;#160; 24.49&amp;#160; |&amp;#160; 23.06&amp;#160; |&amp;#160; 23.60&amp;#160; |&amp;#160; &lt;del class=&quot;diffchange diffchange-inline&quot;&gt;44&lt;/del&gt;.&lt;del class=&quot;diffchange diffchange-inline&quot;&gt;81 &lt;/del&gt; |&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;Tel201406.HW.v2.1.S|&amp;#160; 19.44&amp;#160; |&amp;#160; 17.62&amp;#160; |&amp;#160; 24.49&amp;#160; |&amp;#160; 23.06&amp;#160; |&amp;#160; 23.60&amp;#160; |&amp;#160; &lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;74&lt;/ins&gt;.&lt;ins class=&quot;diffchange diffchange-inline&quot;&gt;61 &lt;/ins&gt; |&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/pre&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/pre&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>Zhaomy</name></author>	</entry>

	<entry>
		<id>http://cslt.org/mediawiki/index.php?title=2014-07-18&amp;diff=10469&amp;oldid=prev</id>
		<title>Cslt：以内容“==Resource Building==  == Leftover questions== * Asymmetric window: Great improvement on training set(WER 34% to 24%), however the improvement is lost on test.  * Multi...”创建新页面</title>
		<link rel="alternate" type="text/html" href="http://cslt.org/mediawiki/index.php?title=2014-07-18&amp;diff=10469&amp;oldid=prev"/>
				<updated>2014-07-18T01:54:13Z</updated>
		
		<summary type="html">&lt;p&gt;以内容“==Resource Building==  == Leftover questions== * Asymmetric window: Great improvement on training set(WER 34% to 24%), however the improvement is lost on test.  * Multi...”创建新页面&lt;/p&gt;
&lt;p&gt;&lt;b&gt;新页面&lt;/b&gt;&lt;/p&gt;&lt;div&gt;==Resource Building==&lt;br /&gt;
&lt;br /&gt;
== Leftover questions==&lt;br /&gt;
* Asymmetric window: Great improvement on training set(WER 34% to 24%), however the improvement is lost on test. &lt;br /&gt;
* Multi GPU training: Error encountered&lt;br /&gt;
* Multilanguage training&lt;br /&gt;
* Investigating LOUDS FST. &lt;br /&gt;
* CLG embedded decoder plus online compiler.&lt;br /&gt;
* DNN-GMM co-training&lt;br /&gt;
&lt;br /&gt;
== AM development ==&lt;br /&gt;
&lt;br /&gt;
=== Sparse DNN ===&lt;br /&gt;
* GA-based block sparsity (++++++++++)&lt;br /&gt;
&lt;br /&gt;
===Noise training===&lt;br /&gt;
:* Journal paper writing ongoing&lt;br /&gt;
&lt;br /&gt;
===Multilingual ASR===&lt;br /&gt;
&lt;br /&gt;
&amp;lt;pre&amp;gt;&lt;br /&gt;
&lt;br /&gt;
LM = Tel201406.HW.v2.1.1&lt;br /&gt;
&lt;br /&gt;
     AM\testset    |JS27H_100|  JS_2h  |ShanXi_2h|ShaanXi2h|Unknown2h|   ENG   |&lt;br /&gt;
 Tel201406.v1.0.S  |         |    -    |    -    |    -    |    -    |    -    |&lt;br /&gt;
 Tel201406.v1.1.S  |    -    |    -    |    -    |    -    |    -    |    -    |&lt;br /&gt;
Tel201406.HW.v2.0.B|  20.18  |  17.49  |  23.85  |  22.81  |  22.48  |  55.06  |&lt;br /&gt;
Tel201406.HW.v2.0.S|  19.95  |  17.74  |  23.73  |  22.36  |  22.49  |  37.63  |&lt;br /&gt;
Tel201406.HW.v2.1.B|  19.14  |  16.97  |  24.26  |  22.28  |  22.97  |  55.35  |&lt;br /&gt;
Tel201406.HW.v2.1.S|  19.44  |  17.62  |  24.49  |  23.06  |  23.60  |  44.81  |&lt;br /&gt;
&amp;lt;/pre&amp;gt;&lt;br /&gt;
&lt;br /&gt;
* v1.*: no English words involved.&lt;br /&gt;
* v2.*: with English words involved.&lt;br /&gt;
&lt;br /&gt;
===Denoising &amp;amp; Farfield ASR===&lt;br /&gt;
&lt;br /&gt;
* Sparse linear prediction. Need to correct the model.&lt;br /&gt;
* Use xEnt as the adaptation object, instead of MSE based feature mapping&lt;br /&gt;
* Use the simulation tool to add reverberation. &lt;br /&gt;
* [http://reverb2014.dereverberation.com/download.html]&lt;br /&gt;
* Investigate the impact of speech rate. Use Tencent 200h data to conduct the experiments.&lt;br /&gt;
* Investigate the correlation between phone speed &amp;amp; entropy.&lt;br /&gt;
&lt;br /&gt;
===VAD===&lt;br /&gt;
&lt;br /&gt;
* Waiting for engineering work&lt;br /&gt;
&lt;br /&gt;
===Scoring===&lt;br /&gt;
&lt;br /&gt;
* Refine the acoustic model with the AMIDA database. Problem solved by involving both WSJ and AMIDA.&lt;br /&gt;
* Model ready for picking up&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
===Embedded decoder===&lt;br /&gt;
&lt;br /&gt;
* The first delivery is Emb201407_BG_v0.0&lt;br /&gt;
* Train two smaller networks: 500x4+600, 400x4+500&lt;br /&gt;
&lt;br /&gt;
==LM development==&lt;br /&gt;
&lt;br /&gt;
===Domain specific LM===&lt;br /&gt;
&lt;br /&gt;
h2. Domain specific LM construction&lt;br /&gt;
&lt;br /&gt;
h3. TAG LM&lt;br /&gt;
* Some problems with the tagging. All numbers are tagged.&lt;br /&gt;
&lt;br /&gt;
h3. Chatting LM&lt;br /&gt;
* Building chatting lexicon&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==Word2Vector==&lt;br /&gt;
&lt;br /&gt;
===W2V based doc classification===&lt;br /&gt;
&lt;br /&gt;
* Initial results with variational Bayesian GMM obtained. Performance is not as good as the conventional GMM.&lt;br /&gt;
* &lt;br /&gt;
&lt;br /&gt;
==Semantic word tree==&lt;br /&gt;
&lt;br /&gt;
:* Version v2.0 released (filter with query log)&lt;br /&gt;
:* Please deliver to /nfs/disk/perm/data/corpora/semanticTree (Xingchao)&lt;br /&gt;
:* Version v3.0 underway. Further refinement with Baidu Baike hierarchy&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==NN LM==&lt;br /&gt;
&lt;br /&gt;
* Character-based NNLM (6700 chars, 7gram), 500M data training done.&lt;br /&gt;
:* Inconsistent patterns in WER were found on Tencent test sets&lt;br /&gt;
:* probably need to use another test set to do investigation. &lt;br /&gt;
&lt;br /&gt;
* Investigate MS RNN LM training&lt;br /&gt;
&lt;br /&gt;
==Speaker ID==&lt;br /&gt;
* reading materials &lt;br /&gt;
* prepare to run sre08&lt;br /&gt;
&lt;br /&gt;
==Translation==&lt;br /&gt;
* Initial version released&lt;br /&gt;
* collecting more data (Xinhua parallel text, Bible, named entities) for the second version&lt;/div&gt;</summary>
		<author><name>Cslt</name></author>	</entry>

	</feed>