<?xml version="1.0"?>
<?xml-stylesheet type="text/css" href="http://www.cslt.org/mediawiki/skins/common/feed.css?303"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="zh-cn">
		<id>http://www.cslt.org/mediawiki/index.php?action=history&amp;feed=atom&amp;title=2014-04-04</id>
		<title>2014-04-04 - 版本历史</title>
		<link rel="self" type="application/atom+xml" href="http://www.cslt.org/mediawiki/index.php?action=history&amp;feed=atom&amp;title=2014-04-04"/>
		<link rel="alternate" type="text/html" href="http://www.cslt.org/mediawiki/index.php?title=2014-04-04&amp;action=history"/>
		<updated>2026-04-04T01:47:10Z</updated>
		<subtitle>本wiki的该页面的版本历史</subtitle>
		<generator>MediaWiki 1.23.3</generator>

	<entry>
		<id>http://www.cslt.org/mediawiki/index.php?title=2014-04-04&amp;diff=9585&amp;oldid=prev</id>
		<title>2014年4月4日 (五) 01:59 Cslt</title>
		<link rel="alternate" type="text/html" href="http://www.cslt.org/mediawiki/index.php?title=2014-04-04&amp;diff=9585&amp;oldid=prev"/>
				<updated>2014-04-04T01:59:58Z</updated>
		
		<summary type="html">&lt;p&gt;&lt;/p&gt;
&lt;table class='diff diff-contentalign-left'&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;tr style='vertical-align: top;'&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;←上一版本&lt;/td&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;2014年4月4日 (五) 01:59的版本&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;第49行：&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;第49行：&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;* Found errors attributed to speaker2utterance&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;* Found errors attributed to speaker2utterance&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;−&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;===Denoising &amp;amp; Farfield ASR&lt;del class=&quot;diffchange diffchange-inline&quot;&gt;=&lt;/del&gt;===&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;===Denoising &amp;amp; Farfield ASR===&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;* First round of recording failed&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;* First round of recording failed&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;* Record farfield wave in next week&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;* Record farfield wave in next week&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>Cslt</name></author>	</entry>

	<entry>
		<id>http://www.cslt.org/mediawiki/index.php?title=2014-04-04&amp;diff=9584&amp;oldid=prev</id>
		<title>Cslt：以内容“==Resource Building== * Current text resource has been re-arranged and listed  == Leftover questions== * Asymmetric window: Great improvement on training set(WER 34% to...”创建新页面</title>
		<link rel="alternate" type="text/html" href="http://www.cslt.org/mediawiki/index.php?title=2014-04-04&amp;diff=9584&amp;oldid=prev"/>
				<updated>2014-04-04T01:58:10Z</updated>
		
		<summary type="html">&lt;p&gt;以内容“==Resource Building== * Current text resource has been re-arranged and listed  == Leftover questions== * Asymmetric window: Great improvement on training set(WER 34% to...”创建新页面&lt;/p&gt;
&lt;p&gt;&lt;b&gt;新页面&lt;/b&gt;&lt;/p&gt;&lt;div&gt;==Resource Building==&lt;br /&gt;
* Current text resource has been re-arranged and listed&lt;br /&gt;
&lt;br /&gt;
== Leftover questions==&lt;br /&gt;
* Asymmetric window: Great improvement on training set(WER 34% to 24%); however, the improvement is lost on the test set. Overfitting? &lt;br /&gt;
* Multi GPU training: Error encountered&lt;br /&gt;
* Multilanguage training&lt;br /&gt;
* Investigating LOUDS FST. &lt;br /&gt;
* CLG embedded decoder plus online compiler.&lt;br /&gt;
* DNN-GMM co-training&lt;br /&gt;
&lt;br /&gt;
== AM development ==&lt;br /&gt;
&lt;br /&gt;
=== Sparse DNN ===&lt;br /&gt;
* GA-based block sparsity&lt;br /&gt;
:* Found a paper in 2000 with similar ideas. &lt;br /&gt;
:* Try to get a student working on high performance computing to do the optimization&lt;br /&gt;
&lt;br /&gt;
===Noise training===&lt;br /&gt;
:* More experiments with no-noise&lt;br /&gt;
:* More experiments with additional noise types&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
===AMR compression re-training===&lt;br /&gt;
&lt;br /&gt;
* 1700h MPE adaptation&lt;br /&gt;
&lt;br /&gt;
:* iter1:&lt;br /&gt;
amr: %WER 13.40 [ 6398 / 47753, 252 ins, 829 del, 5317 sub ]&lt;br /&gt;
wav: %WER 11.19 [ 5343 / 47753, 178 ins, 710 del, 4455 sub ]&lt;br /&gt;
&lt;br /&gt;
:* iter2:&lt;br /&gt;
amr: %WER 13.31 [ 6358 / 47753, 255 ins, 798 del, 5305 sub ]&lt;br /&gt;
wav: %WER 11.33 [ 5409 / 47753, 180 ins, 732 del, 4497 sub ]&lt;br /&gt;
&lt;br /&gt;
:* iter3:&lt;br /&gt;
amr: %WER 13.25 [ 6326 / 47753, 230 ins, 823 del, 5273 sub ]&lt;br /&gt;
wav: %WER 11.43 [ 5460 / 47753, 199 ins, 709 del, 4552 sub ]&lt;br /&gt;
&lt;br /&gt;
:* iter4:&lt;br /&gt;
amr: %WER 13.17 [ 6289 / 47753, 225 ins, 833 del, 5231 sub ]&lt;br /&gt;
wav: %WER 11.44 [ 5461 / 47753, 200 ins, 693 del, 4568 sub ]&lt;br /&gt;
&lt;br /&gt;
:* iter5:&lt;br /&gt;
amr: %WER 13.17 [ 6291 / 47753, 254 ins, 769 del, 5268 sub ]&lt;br /&gt;
wav: %WER 11.46 [ 5471 / 47753, 200 ins, 696 del, 4575 sub ]&lt;br /&gt;
&lt;br /&gt;
===GFbank===&lt;br /&gt;
* Found errors attributed to speaker2utterance&lt;br /&gt;
&lt;br /&gt;
===Denoising &amp;amp; Farfield ASR====&lt;br /&gt;
* First round of recording failed&lt;br /&gt;
* Record farfield wave in next week&lt;br /&gt;
&lt;br /&gt;
===VAD===&lt;br /&gt;
* Source code prepared&lt;br /&gt;
* Prepare DNN pipeline&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==Word to Vector==&lt;br /&gt;
&lt;br /&gt;
* LDA baseline (sogou 1700*9 training set)&lt;br /&gt;
:* Training done&lt;br /&gt;
:* Training classifier &lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==LM development==&lt;br /&gt;
&lt;br /&gt;
===NN LM===&lt;br /&gt;
&lt;br /&gt;
* Character-based NNLM (6700 chars, 7gram), 500M data training done.&lt;br /&gt;
:* boundary-involved char NNLM training done&lt;br /&gt;
:* Word-boundary seems less important than char history&lt;br /&gt;
&lt;br /&gt;
* Investigate MS RNN LM training&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==Pronunciation scoring==&lt;br /&gt;
* 8k model delivered&lt;br /&gt;
* MLP-based scoring completed&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==QA==&lt;br /&gt;
&lt;br /&gt;
===FST-based matching===&lt;br /&gt;
:* Char FST under investigation &lt;br /&gt;
:* FST-based QA patent done&lt;br /&gt;
&lt;br /&gt;
===Speech QA===&lt;br /&gt;
*Class LM QA&lt;br /&gt;
:* excellent done&lt;br /&gt;
:* investigated various stepping-in weights; found that a negative weight (-1) is effective for encouraging entity recognition&lt;br /&gt;
:* investigated performance reduction due to the preference on small words. Introduced a factor on L.fst to discourage short words.&lt;/div&gt;</summary>
		<author><name>Cslt</name></author>	</entry>

	</feed>