<?xml version="1.0"?>
<?xml-stylesheet type="text/css" href="http://www.cslt.org/mediawiki/skins/common/feed.css?303"?>
<feed xmlns="http://www.w3.org/2005/Atom" xml:lang="zh-cn">
		<id>http://www.cslt.org/mediawiki/index.php?action=history&amp;feed=atom&amp;title=2013-08-23</id>
		<title>2013-08-23 - 版本历史</title>
		<link rel="self" type="application/atom+xml" href="http://www.cslt.org/mediawiki/index.php?action=history&amp;feed=atom&amp;title=2013-08-23"/>
		<link rel="alternate" type="text/html" href="http://www.cslt.org/mediawiki/index.php?title=2013-08-23&amp;action=history"/>
		<updated>2026-04-04T02:02:45Z</updated>
		<subtitle>本wiki的该页面的版本历史</subtitle>
		<generator>MediaWiki 1.23.3</generator>

	<entry>
		<id>http://www.cslt.org/mediawiki/index.php?title=2013-08-23&amp;diff=8068&amp;oldid=prev</id>
		<title>Cslt：/* GFCC DNN */</title>
		<link rel="alternate" type="text/html" href="http://www.cslt.org/mediawiki/index.php?title=2013-08-23&amp;diff=8068&amp;oldid=prev"/>
				<updated>2013-08-23T03:13:35Z</updated>
		
		<summary type="html">&lt;p&gt;‎&lt;span dir=&quot;auto&quot;&gt;&lt;span class=&quot;autocomment&quot;&gt;GFCC DNN&lt;/span&gt;&lt;/span&gt;&lt;/p&gt;
&lt;table class='diff diff-contentalign-left'&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;col class='diff-marker' /&gt;
				&lt;col class='diff-content' /&gt;
				&lt;tr style='vertical-align: top;'&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;←上一版本&lt;/td&gt;
				&lt;td colspan='2' style=&quot;background-color: white; color:black; text-align: center;&quot;&gt;2013年8月23日 (五) 03:13的版本&lt;/td&gt;
				&lt;/tr&gt;&lt;tr&gt;&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;第77行：&lt;/td&gt;
&lt;td colspan=&quot;2&quot; class=&quot;diff-lineno&quot;&gt;第77行：&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;#160;&amp;#160; &amp;#160; speedup: %WER 60.38 [ 3173 / 5255, 25 ins, 1061 del, 2087 sub ]&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;#160;&amp;#160; &amp;#160; speedup: %WER 60.38 [ 3173 / 5255, 25 ins, 1061 del, 2087 sub ]&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;−&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/pre&amp;gt; &amp;#160;&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;lt;/pre&amp;gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;−&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #ffe49c; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&amp;#160;&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot;&gt;&amp;#160;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;* GFCC is generally better than MFCC, particularly with noise&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot;&gt;&amp;#160;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;* noise impact is significantly high. Need de-noise algorithms&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td colspan=&quot;2&quot;&gt;&amp;#160;&lt;/td&gt;&lt;td class='diff-marker'&gt;+&lt;/td&gt;&lt;td style=&quot;color:black; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #a3d3ff; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;&lt;ins style=&quot;font-weight: bold; text-decoration: none;&quot;&gt;* Try noise-robust training&lt;/ins&gt;&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;tr&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;==Stream decoding==&lt;/div&gt;&lt;/td&gt;&lt;td class='diff-marker'&gt;&amp;#160;&lt;/td&gt;&lt;td style=&quot;background-color: #f9f9f9; color: #333333; font-size: 88%; border-style: solid; border-width: 1px 1px 1px 4px; border-radius: 0.33em; border-color: #e6e6e6; vertical-align: top; white-space: pre-wrap;&quot;&gt;&lt;div&gt;==Stream decoding==&lt;/div&gt;&lt;/td&gt;&lt;/tr&gt;
&lt;/table&gt;</summary>
		<author><name>Cslt</name></author>	</entry>

	<entry>
		<id>http://www.cslt.org/mediawiki/index.php?title=2013-08-23&amp;diff=8067&amp;oldid=prev</id>
		<title>Cslt：以内容“== Data sharing ==  * LM count files still undelivered!  == DNN progress ==  === Discriminative DNN ===  * Running 1200-3620 NN, graph generation is done. Training is s...”创建新页面</title>
		<link rel="alternate" type="text/html" href="http://www.cslt.org/mediawiki/index.php?title=2013-08-23&amp;diff=8067&amp;oldid=prev"/>
				<updated>2013-08-23T02:55:56Z</updated>
		
		<summary type="html">&lt;p&gt;以内容“== Data sharing ==  * LM count files still undelivered!  == DNN progress ==  === Discriminative DNN ===  * Running 1200-3620 NN, graph generation is done. Training is s...”创建新页面&lt;/p&gt;
&lt;p&gt;&lt;b&gt;新页面&lt;/b&gt;&lt;/p&gt;&lt;div&gt;== Data sharing ==&lt;br /&gt;
&lt;br /&gt;
* LM count files still undelivered!&lt;br /&gt;
&lt;br /&gt;
== DNN progress ==&lt;br /&gt;
&lt;br /&gt;
=== Discriminative DNN ===&lt;br /&gt;
&lt;br /&gt;
* Running 1200-3620 NN, graph generation is done. Training is still running stupidly. &lt;br /&gt;
&lt;br /&gt;
=== Sparse DNN ===&lt;br /&gt;
&lt;br /&gt;
* Iterative sparse sticky training runs. &lt;br /&gt;
&lt;br /&gt;
=== Tencent exps ===&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==DNN Confidence estimation==&lt;br /&gt;
&lt;br /&gt;
* Tested on a high WER test set. The distribution curve is still bizzard, for both correct and incorrect words, a high peak is around zero.&lt;br /&gt;
* Accumulated DNN confidence is on development. &lt;br /&gt;
* Generate lattice-based confidence&lt;br /&gt;
* Prepare MLP-based confidence integration&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==GFCC DNN ==&lt;br /&gt;
&lt;br /&gt;
*GFCC computing is highly slow. 100 hour speech costs 16 hour cpu time. RT is around 0.2. It is intolerable. &lt;br /&gt;
*100 hour GFCC-based DNN, Tencent test results:&lt;br /&gt;
&lt;br /&gt;
&amp;lt;pre&amp;gt;&lt;br /&gt;
&lt;br /&gt;
No noise-added:&lt;br /&gt;
&lt;br /&gt;
1,MFCC 100_1200_1200_1200_1200_3580&lt;br /&gt;
       map: %WER 23.75 [ 3474 / 14628, 134 ins, 373 del, 2967 sub ]&lt;br /&gt;
       2044: %WER 21.47 [ 4991 / 23241, 304 ins, 664 del, 4023 sub ]&lt;br /&gt;
       notetp3: %WER 13.17 [ 244 / 1853, 10 ins, 26 del, 208 sub ]&lt;br /&gt;
       record1900: %WER 8.10 [ 963 / 11888, 217 ins, 299 del, 447 sub ]&lt;br /&gt;
       general: %WER 34.41 [ 12943 / 37619, 779 ins, 785 del, 11379 sub ]&lt;br /&gt;
       online1: %WER 33.02 [ 9388 / 28433, 522 ins, 1465 del, 7401 sub ]&lt;br /&gt;
       online2: %WER 25.99 [ 15363 / 59101, 873 ins, 2408 del, 12082 sub ]&lt;br /&gt;
       speedup: %WER 23.52 [ 1236 / 5255, 72 ins, 213 del, 951 sub ]&lt;br /&gt;
       ----&lt;br /&gt;
2,GFCC 100_1200_1200_1200_1200_3625&lt;br /&gt;
       map: %WER 22.95 [ 3357 / 14628, 109 ins, 471 del, 2777 sub ]&lt;br /&gt;
       2044: %WER 20.93 [ 4865 / 23241, 387 ins, 748 del, 3730 sub ]&lt;br /&gt;
       notetp3: %WER 15.43 [ 286 / 1853, 41 ins, 26 del, 219 sub ]&lt;br /&gt;
       record1900: %WER 7.32 [ 870 / 11888, 107 ins, 266 del, 497 sub ]&lt;br /&gt;
       general: %WER 31.57 [ 11878 / 37619, 587 ins, 861 del, 10430 sub ]&lt;br /&gt;
       online1: %WER 31.83 [ 9049 / 28433, 519 ins, 1506 del, 7024 sub ]&lt;br /&gt;
       online2: %WER 25.20 [ 14894 / 59101, 839 ins, 2434 del, 11621 sub ]&lt;br /&gt;
       speedup: %WER 22.97 [ 1207 / 5255, 73 ins, 221 del, 913 sub ]&lt;br /&gt;
       ----&lt;br /&gt;
&lt;br /&gt;
White noise added into the test data:&lt;br /&gt;
&lt;br /&gt;
1,NOISE LEVEL:about 15db&lt;br /&gt;
  1) MFCC 100_1200_1200_1200_1200_3580&lt;br /&gt;
    map: %WER 65.24 [ 9544 / 14628, 48 ins, 2841 del, 6655 sub ]&lt;br /&gt;
    2044: %WER 48.93 [ 11372 / 23241, 176 ins, 2803 del, 8393 sub ]&lt;br /&gt;
    notetp3: %WER 55.91 [ 1036 / 1853, 9 ins, 476 del, 551 sub ]&lt;br /&gt;
    record1900: %WER 25.43 [ 3023 / 11888, 27 ins, 1387 del, 1609 sub ]&lt;br /&gt;
    general: %WER 70.05 [ 26352 / 37619, 141 ins, 5336 del, 20875 sub ]&lt;br /&gt;
    online1: %WER 50.40 [ 14329 / 28433, 431 ins, 3827 del, 10071 sub ]&lt;br /&gt;
    online2: %WER 48.45 [ 28632 / 59101, 664 ins, 7930 del, 20038 sub ]&lt;br /&gt;
    speedup: %WER 64.78 [ 3404 / 5255, 13 ins, 1084 del, 2307 sub ]&lt;br /&gt;
    ----&lt;br /&gt;
  2)GFCC 100_1200_1200_1200_1200_3625&lt;br /&gt;
    map: %WER 62.99 [ 9214 / 14628, 63 ins, 3113 del, 6038 sub ]&lt;br /&gt;
    2044: %WER 46.34 [ 10769 / 23241, 251 ins, 2897 del, 7621 sub ]&lt;br /&gt;
    notetp3: %WER 52.46 [ 972 / 1853, 18 ins, 545 del, 409 sub ]&lt;br /&gt;
    record1900: %WER 26.62 [ 3164 / 11888, 133 ins, 1181 del, 1850 sub ]&lt;br /&gt;
    general: %WER 66.04 [ 24843 / 37619, 404 ins, 5277 del, 19162 sub ]&lt;br /&gt;
    online1: %WER 46.61 [ 13254 / 28433, 466 ins, 3725 del, 9063 sub ]&lt;br /&gt;
    online2: %WER 44.49 [ 26292 / 59101, 813 ins, 7552 del, 17927 sub ]&lt;br /&gt;
    speedup: %WER 60.38 [ 3173 / 5255, 25 ins, 1061 del, 2087 sub ]&lt;br /&gt;
&lt;br /&gt;
&amp;lt;/pre&amp;gt; &lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==Stream decoding==&lt;br /&gt;
&lt;br /&gt;
* The interface for server-side is done. For embedded-side is on development. &lt;br /&gt;
&lt;br /&gt;
To do:&lt;br /&gt;
* global CMN initialization.&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
==Subgraph integration==&lt;br /&gt;
&lt;br /&gt;
* Compress subgraph HCLG is done. The integration is around 1-2 seconds. &lt;br /&gt;
* G.fst integration encounters a problem: after G+L, determinization is halted. &lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
== Embedded progress ==&lt;br /&gt;
&lt;br /&gt;
* GFCC-based engine test. Just started.&lt;/div&gt;</summary>
		<author><name>Cslt</name></author>	</entry>

	</feed>