<!doctype html>
<html xmlns="http://www.w3.org/1999/xhtml" lang="zh-Hans">
<head>
<meta charset="utf-8">
<meta name="generator" content="pdf2htmlEX">
<meta http-equiv="X-UA-Compatible" content="IE=edge,chrome=1">
<!-- Title mirrors the article heading printed on page 1; it was previously empty. -->
<title>MATLAB环境下的基于HMM模型的语音识别系统</title>
<!-- Shared pdf2htmlEX styles first, then the per-document stylesheet (raw.css). -->
<link rel="stylesheet" href="https://static.pudn.com/base/css/base.min.css">
<link rel="stylesheet" href="https://static.pudn.com/base/css/fancy.min.css">
<link rel="stylesheet" href="https://static.pudn.com/prod/directory_preview_static/6250997e74bc5c01056b6b60/raw.css">
<!-- These scripts stay synchronous: the inline script below uses the pdf2htmlEX global right away. -->
<script src="https://static.pudn.com/base/js/compatibility.min.js"></script>
<script src="https://static.pudn.com/base/js/pdf2htmlEX.min.js"></script>
<script>
// Best-effort viewer start-up: the page must still display if the viewer
// script failed to load or its constructor throws, so the error is reported
// (when a console exists) instead of being rethrown.
try {
  pdf2htmlEX.defaultViewer = new pdf2htmlEX.Viewer({});
} catch (e) {
  if (window.console && typeof console.warn === "function") {
    console.warn("pdf2htmlEX viewer could not be initialised", e);
  }
}
</script>
</head>
<body>
<!-- Outline sidebar shell: kept hidden by its inline style; the outline container has no entries. -->
<div id="sidebar" style="display: none">
  <div id="outline">
  </div>
</div>
<!--
  Page 1 of the converted document (id "pf1", data-page-no="1").
  Structure as visible in the markup:
    * one page wrapper (class "pf") holding one content box (class "pc");
    * a background image bg1.jpg (class "bi") with empty alt text;
    * a long run of text divs (class "t"), each tagged with m/x/h/y/ff/fs/fc/sc/ls/ws
      classes whose rules live in the external stylesheets, not in this file;
    * empty or single-space span elements with classes "_ _N" between glyph runs
      (presumably spacing adjustments; confirm against base.min.css and raw.css);
    * a trailing div (class "pi") carrying a JSON "ctm" matrix in its data-data attribute.
  Text content: journal running header, article title, authors and affiliation,
  Chinese and English abstracts with keywords, the caption of figure 1, then the
  opening of sections 0, 1 and its two numbered subsections.
  NOTE(review): runs in font class ff5 contain "1" and "2" where the surrounding text reads
  like a decimal point (recognition time "1 1 5~3 s") and a line-end hyphen ("cir 2 cumstance").
  This looks like a remapped glyph font, so do not correct these characters without checking
  the font definition. TODO confirm.
  The markup below is generator output; its physical line breaks fall inside tags and act
  only as whitespace.
-->
<div id="pf1" class="pf w0 h0" data-page-no="1"><div class="pc pc1 w0 h0"><img class="bi x0 y0 w1 h1" alt="" src="https://static.pudn.com/prod/directory_preview_static/6250997e74bc5c01056b6b60/bg1.jpg"><div class="t m0 x1 h2 y1 ff1 fs0 fc0 sc0 ls0 ws0"> </div><div class="t m0 x2 h3 y2 ff1 fs1 fc0 sc0 ls0 ws0"> <span class="_ _0"></span>·<span class="_ _1"></span><span class="ff2 fs2">47<span class="_ _2"></span>0<span class="_ _3"> </span><span class="ff1 fs1">·<span class="_ _0"></span>     </span></span></div><div class="t m0 x3 h2 y3 ff1 fs0 fc0 sc0 ls0 ws0">计<span class="_ _4"></span>算<span class="_ _4"></span>机<span class="_ _5"></span>测<span class="_ _5"></span>量<span class="_ _4"></span>与<span class="_ _5"></span>控<span class="_ _4"></span>制<span class="_ _6"> </span><span class="ff2 fs3">.<span class="_ _7"> </span>2<span class="_ _5"></span>0<span class="_ _5"></span>0<span class="_ _5"></span>4<span class="_ _6"> </span>.<span class="_ _7"> </span>1<span class="_ _5"></span>2</span></div><div class="t m0 x4 h4 y4 ff2 fs3 fc0 sc0 ls0 ws0">(</div><div class="t m0 x5 h4 y3 ff2 fs3 fc0 sc0 ls0 ws0">5</div><div class="t m0 x6 h4 y4 ff2 fs3 fc0 sc0 ls0 ws0">)</div><div class="t m0 x7 h2 y3 ff1 fs0 fc0 sc0 ls0 ws0"> </div><div class="t m0 x3 h5 y5 ff3 fs3 fc0 sc0 ls0 ws0">C<span class="_ _2"></span>om<span class="_ _2"></span>p<span class="_ _2"></span>u<span class="_ _8"></span>te<span class="_ _2"></span>r<span class="_ _9"> </span>M<span class="_ _8"></span>e<span class="_ _2"></span>a<span class="_ _a"></span>su<span class="_ _8"></span>rem<span class="_ _8"></span>ent<span class="_ _b"> </span>&<span class="_ _c"> </span>C<span class="_ _8"></span>o<span class="_ _2"></span>nt<span class="_ _2"></span>ro<span class="_ _2"></span>l<span class="_ _6"> </span><span class="ff1 fs0"> </span></div><div class="t m0 x8 h6 y6 ff4 fs4 fc0 sc0 ls0 ws0">设<span class="_ _2"></span>计<span class="_ _2"></span>与应<span class="_ _8"></span>用</div><div class="t m0 x9 h2 y7 
ff4 fs0 fc0 sc0 ls0 ws0">收稿日期<span class="_ _d"> </span><span class="ff2 fs3">:200<span class="_ _2"></span>3<span class="_"> </span>-<span class="_ _e"> </span>08<span class="_"> </span>-<span class="_ _e"> </span>1<span class="_ _2"></span>0</span></div><div class="t m0 x9 h2 y8 ff4 fs0 fc0 sc0 ls0 ws0">基金项目<span class="_ _d"> </span><span class="ff2 fs3">:<span class="_ _a"></span></span><span class="ff1">山西省自然科学基金资助项目</span></div><div class="t m0 x9 h2 y9 ff4 fs0 fc0 sc0 ls0 ws0">作<span class="_ _2"></span>者简介<span class="_ _d"> </span><span class="ff2 fs3">:<span class="_ _4"></span></span><span class="ff1">郭<span class="_ _5"></span>圣<span class="_ _5"></span>权</span></div><div class="t m0 xa h4 ya ff2 fs3 fc0 sc0 ls0 ws0">(</div><div class="t m0 xb h4 y9 ff2 fs3 fc0 sc0 ls0 ws0">19<span class="_ _2"></span>3<span class="_ _2"></span>9<span class="_ _3"> </span>-</div><div class="t m0 xc h4 ya ff2 fs3 fc0 sc0 ls0 ws0">)</div><div class="t m0 xd h2 y9 ff2 fs3 fc0 sc0 ls0 ws0">,<span class="_ _5"></span><span class="ff1 fs0">男<span class="_ _7"> </span></span>,<span class="_ _a"></span><span class="ff1 fs0">山<span class="_ _5"></span>西<span class="_ _5"></span>省<span class="_ _5"></span>定<span class="_ _5"></span>襄<span class="_ _5"></span>县<span class="_ _5"></span>人<span class="_ _7"> </span></span>,<span class="_ _5"></span><span class="ff1 fs0">教</span></div><div class="t m0 xe h2 yb ff1 fs0 fc0 sc0 ls0 ws0">授<span class="_ _7"> </span><span class="ff2 fs3">,</span>主要从事导航<span class="_ _4"></span>、<span class="_ _f"></span>制导及语音识别在导航定位系统中的应</div><div class="t m0 xe h2 yc ff1 fs0 fc0 sc0 ls0 ws0">用<span class="_ _4"></span>。</div><div class="t m0 xe h2 yd ff4 fs0 fc0 sc0 ls0 ws0">文章编号<span class="_ _d"> </span><span class="ff2 fs3">:16<span class="_ _2"></span>71<span class="_"> </span>-<span class="_ _e"> </span>4<span class="_ _2"></span>59<span class="_ _2"></span>8</span></div><div class="t m0 xf h4 ye ff2 fs3 fc0 sc0 ls0 ws0">(</div><div class="t m0 x10 
h4 yd ff2 fs3 fc0 sc0 ls0 ws0">20<span class="_ _2"></span>0<span class="_ _2"></span>4</div><div class="t m0 x11 h4 ye ff2 fs3 fc0 sc0 ls0 ws0">)</div><div class="t m0 x12 h2 yd ff2 fs3 fc0 sc0 ls0 ws0">05<span class="_"> </span>-<span class="_ _e"> </span>0<span class="_ _2"></span>47<span class="_ _2"></span>0<span class="_"> </span>-<span class="_ _e"> </span>03<span class="_ _6"> </span><span class="ff4 fs0">      <span class="_ _1"></span>中图分类号<span class="_ _6"> </span><span class="ff2 fs3">:<span class="_ _4"></span>T<span class="_ _8"></span>P<span class="_ _8"></span>3<span class="_ _2"></span>1<span class="_"> </span><span class="ff4 fs0">      <span class="_ _0"></span>文献标识码<span class="_ _d"> </span><span class="ff2 fs3">:B</span></span></span></span></div><div class="t m0 x13 h7 yf ff3 fs5 fc0 sc0 ls0 ws0">MA<span class="_ _5"></span>T<span class="_ _10"></span>L<span class="_ _6"></span>A<span class="_ _a"></span>B<span class="_ _e"> </span><span class="ff4 fs6">环境下的基于<span class="_ _11"> </span></span>H<span class="_ _0"></span>M<span class="_ _2"></span>M<span class="_"> </span><span class="ff4 fs6">模型的语音识别系统</span></div><div class="t m0 x14 h8 y10 ff1 fs7 fc0 sc0 ls0 ws0">郭圣权<span class="_ _12"> </span><span class="ff2 fs8">,<span class="_ _13"> </span></span>连晓峰</div><div class="t m0 x3 h4 y11 ff2 fs3 fc0 sc0 ls0 ws0">(</div><div class="t m0 x15 h2 y12 ff1 fs0 fc0 sc0 ls0 ws0">华北工学院<span class="_ _3"> </span>自动控制系<span class="_ _14"> </span><span class="ff2 fs3">,<span class="_ _c"> </span></span>山西<span class="_ _3"> </span>太原<span class="_ _14"> </span> <span class="_ _0"></span><span class="ff2 fs3">030<span class="_ _2"></span>0<span class="_ _2"></span>51</span></div><div class="t m0 x16 h4 y11 ff2 fs3 fc0 sc0 ls0 ws0">)</div><div class="t m0 x17 h2 y13 ff4 fs0 fc0 sc0 ls0 ws0">摘要<span class="_ _6"> </span><span class="ff2 fs3">:<span class="_ _15"> </span></span><span class="ff1">在<span class="_ _d"> </span><span class="ff2 fs3">M<span 
class="_ _16"></span>AT<span class="_ _1"></span>L<span class="_ _2"></span>A<span class="_ _16"></span>B<span class="_"> </span><span class="ff1 fs0">环境下利用语音工具箱<span class="_ _d"> </span></span>V<span class="_ _16"></span>oice<span class="_ _14"> </span>B<span class="_ _8"></span>ox<span class="_ _d"> </span><span class="ff1 fs0">实现基于<span class="_ _a"></span>连<span class="_ _a"></span>续概<span class="_ _a"></span>率<span class="_ _a"></span>密度<span class="_ _a"></span>隐<span class="_ _a"></span>含马<span class="_ _a"></span>尔<span class="_ _a"></span>科夫<span class="_ _a"></span>模<span class="_ _a"></span>型的<span class="_ _a"></span>汉<span class="_ _a"></span>语语<span class="_ _a"></span>音<span class="_ _a"></span>识别<span class="_ _a"></span>系<span class="_ _a"></span>统<span class="_ _4"></span>。<span class="_ _16"></span>在</span></span></span></div><div class="t m0 x9 h2 y14 ff1 fs0 fc0 sc0 ls0 ws0">实时录音的情况下<span class="_ _14"> </span><span class="ff2 fs3">,<span class="_ _c"> </span></span>利用该语音识别系统<span class="_ _7"> </span><span class="ff2 fs3">,<span class="_ _c"> </span></span>不同的人对<span class="_ _14"> </span><span class="ff2 fs3">20<span class="_"> </span></span>条<span class="_ _d"> </span><span class="ff2 fs3">2</span>~<span class="ff2 fs3">8<span class="_"> </span></span>个字的语音命令进行识别<span class="_ _14"> </span><span class="ff2 fs3">,<span class="_ _c"> </span></span>准确率<span class="_ _a"></span>可达<span class="_ _a"></span>到<span class="_ _14"> </span><span class="ff2 fs3">95<span class="_"> </span>%<span class="_"> </span>,<span class="_ _c"> </span></span>识别<span class="_ _a"></span>时间</div><div class="t m0 x9 h9 y15 ff2 fs3 fc0 sc0 ls0 ws0">1<span class="ff5 fs0">1<span class="_ _8"></span><span class="ff2 fs3">5<span class="ff1 fs0">~</span>3<span class="_ _3"> </span>s<span class="_"> </span>,<span class="_ _c"> </span><span class="ff1 fs0">实现了小词汇量连续语音的非特定人的实时识别<span class="_ _4"></span>。</span></span></span></div><div class="t m0 x17 h2 y16 ff4 fs0 fc0 sc0 
ls0 ws0">关键词<span class="_ _d"> </span><span class="ff2 fs3">:<span class="_ _17"> </span></span><span class="ff1">语音识别<span class="_ _d"> </span><span class="ff2 fs3">;<span class="_ _c"> </span>M<span class="_ _16"></span>AT<span class="_ _1"></span>L<span class="_ _2"></span>A<span class="_ _16"></span>B<span class="_ _6"> </span>;<span class="_ _17"> </span><span class="ff1 fs0">连续概率密度隐含马尔科夫模型</span></span></span></div><div class="t m0 x18 h4 y17 ff2 fs3 fc0 sc0 ls0 ws0">(</div><div class="t m0 x19 h4 y16 ff2 fs3 fc0 sc0 ls0 ws0">C<span class="_ _16"></span>DH<span class="_ _16"></span>M<span class="_ _18"></span>M</div><div class="t m0 x1a h4 y17 ff2 fs3 fc0 sc0 ls0 ws0">)</div><div class="t m0 x1b ha y18 ff3 fs8 fc0 sc0 ls0 ws0">Sp<span class="_ _18"></span>eec<span class="_ _a"></span>h<span class="_ _9"> </span>R<span class="_ _1"></span>ecog<span class="_ _8"></span>n<span class="_ _a"></span>i<span class="_ _2"></span>t<span class="_ _a"></span>i<span class="_ _2"></span>o<span class="_ _8"></span>n<span class="_ _19"> </span>S<span class="_ _8"></span>ys<span class="_ _2"></span>te<span class="_ _a"></span>m<span class="_ _19"> </span>B<span class="_ _0"></span>a<span class="_ _4"></span>s<span class="_ _8"></span>e<span class="_ _5"></span>d<span class="_ _c"> </span>o<span class="_ _8"></span>n<span class="_ _13"> </span>H<span class="_ _18"></span>M<span class="_ _2"></span>M<span class="_ _17"> </span>i<span class="_ _16"></span>n<span class="_ _19"> </span>MA<span class="_ _a"></span>T<span class="_ _1"></span>L<span class="_ _4"></span>A<span class="_ _a"></span>B<span class="_ _17"> </span>E<span class="_ _18"></span>nvi<span class="_ _8"></span>r<span class="_ _a"></span>o<span class="_ _8"></span>n<span class="_ _5"></span>m<span class="_ _16"></span>ent</div><div class="t m0 x1c hb y19 ff2 fs1 fc0 sc0 ls0 ws0">G<span class="_ _18"></span>u<span class="_ _18"></span>o<span class="_ _e"> </span>S<span class="_ _8"></span>hen<span class="_ 
_8"></span>gq<span class="_ _2"></span>u<span class="_ _2"></span>an<span class="_"> </span>,<span class="_ _17"> </span>Lian<span class="_ _e"> </span>X<span class="_ _18"></span>ia<span class="_ _16"></span>o<span class="_ _8"></span>f<span class="_ _a"></span>en<span class="_ _2"></span>g</div><div class="t m0 x1d h4 y1a ff2 fs3 fc0 sc0 ls0 ws0">(</div><div class="t m0 x1e h2 y1b ff2 fs3 fc0 sc0 ls0 ws0">D<span class="_ _2"></span>e<span class="_ _8"></span>pt<span class="_ _5"></span>.<span class="_ _19"> </span>o<span class="_ _8"></span>f<span class="_ _3"> </span>Au<span class="_ _16"></span>t<span class="_ _2"></span>om<span class="_ _8"></span>a<span class="_ _2"></span>tic<span class="_ _3"> </span>C<span class="_ _18"></span>on<span class="_ _2"></span>tr<span class="_ _16"></span>ol<span class="_ _7"> </span>,<span class="_ _c"> </span>N<span class="_ _18"></span>o<span class="_ _a"></span>r<span class="_ _8"></span>t<span class="_ _a"></span>h<span class="_ _1a"> </span>C<span class="_ _8"></span>h<span class="_ _2"></span>ina<span class="_ _12"> </span>I<span class="_ _8"></span>ns<span class="_ _8"></span>titu<span class="_ _8"></span>te<span class="_ _7"> </span>o<span class="_ _8"></span>f<span class="_ _e"> </span>T<span class="_ _16"></span>ech<span class="_ _2"></span>n<span class="_ _16"></span>ol<span class="_ _8"></span>og<span class="_ _8"></span>y<span class="_"> </span>,<span class="_ _17"> </span>T<span class="_ _16"></span>a<span class="_ _2"></span>iy<span class="_ _2"></span>u<span class="_ _2"></span>an<span class="_ _a"></span><span class="ff1 fs0"> <span class="_ _1b"></span><span class="ff2 fs3">03<span class="_ _2"></span>0<span class="_ _2"></span>05<span class="_ _2"></span>1<span class="_"> </span>,<span class="_ _17"> </span>C<span class="_ _2"></span>h<span class="_ _8"></span>i<span class="_ _a"></span>n<span class="_ _8"></span>a</span></span></div><div class="t m0 x1f h4 y1a ff2 fs3 fc0 sc0 ls0 ws0">)</div><div class="t m0 
x17 h9 y1c ff3 fs3 fc0 sc0 ls0 ws0">A<span class="_ _2"></span>b<span class="_ _2"></span>s<span class="_ _2"></span>t<span class="_ _2"></span>r<span class="_ _8"></span>a<span class="_ _a"></span>ct<span class="_"> </span>:<span class="_ _3"> </span><span class="ff2">Us<span class="_ _16"></span>i<span class="_ _a"></span>n<span class="_ _8"></span>g<span class="_"> </span>V<span class="_ _16"></span>oic<span class="_ _2"></span>e<span class="_"> </span>-<span class="_ _3"> </span>B<span class="_ _8"></span>ox<span class="_ _14"> </span>a<span class="_ _3"> </span>m<span class="_ _16"></span>and<span class="_ _8"></span>ar<span class="_ _2"></span>in<span class="_ _3"> </span>s<span class="_ _16"></span>pee<span class="_ _2"></span>ch<span class="_ _1a"> </span>r<span class="_ _2"></span>ec<span class="_ _16"></span>og<span class="_ _8"></span>n<span class="_ _8"></span>iti<span class="_ _8"></span>on<span class="_ _3"> </span>s<span class="_ _8"></span>ys<span class="_ _16"></span>te<span class="_ _2"></span>m<span class="_"> </span>i<span class="_ _a"></span>s<span class="_ _1a"> </span>r<span class="_ _2"></span>ea<span class="_ _8"></span>li<span class="_ _2"></span>z<span class="_ _2"></span>ed<span class="_ _1a"> </span>b<span class="_ _8"></span>a<span class="_ _a"></span>s<span class="_ _16"></span>ed<span class="_"> </span>o<span class="_ _a"></span>n<span class="_ _7"> </span>C<span class="_ _16"></span>DH<span class="_ _18"></span>M<span class="_ _18"></span>M<span class="_"> </span>in<span class="_ _14"> </span>M<span class="_ _16"></span>A<span class="_ _18"></span>T<span class="_ _1b"></span>LA<span class="_ _18"></span>B<span class="_ _c"> </span>en<span class="_ _8"></span>v<span class="_ _16"></span>i<span class="_ _a"></span>r<span class="_ _16"></span>on<span class="_ _2"></span>m<span class="_ _16"></span>en<span class="_ _8"></span>t<span class="_ _5"></span>.<span class="_ _c"> </span>Un<span class="_ _2"></span>d<span class="_ 
_8"></span>er<span class="_ _1a"> </span>th<span class="_ _2"></span>e<span class="_ _1a"> </span>cir<span class="_ _10"></span><span class="ff5 fs0">2</span></span></div><div class="t m0 x9 h9 y1d ff2 fs3 fc0 sc0 ls0 ws0">cu<span class="_ _8"></span>m<span class="_ _2"></span>s<span class="_ _16"></span>t<span class="_ _a"></span>an<span class="_ _8"></span>ce<span class="_ _7"> </span>o<span class="_ _16"></span>f<span class="_ _3"> </span>t<span class="_ _a"></span>h<span class="_ _8"></span>e<span class="_ _1a"> </span>r<span class="_ _2"></span>ea<span class="_ _8"></span>l<span class="_ _7"> </span>-<span class="_ _12"> </span>tim<span class="_ _8"></span>e<span class="_ _7"> </span>re<span class="_ _2"></span>c<span class="_ _16"></span>ord<span class="_ _8"></span>i<span class="_ _a"></span>n<span class="_ _2"></span>g<span class="_ _6"> </span>,<span class="_ _17"> </span>d<span class="_ _8"></span>i<span class="_ _8"></span>f<span class="_ _8"></span>f<span class="_ _a"></span>e<span class="_ _2"></span>ren<span class="_ _16"></span>t<span class="_ _7"> </span>pe<span class="_ _8"></span>o<span class="_ _2"></span>ple<span class="_"> </span>t<span class="_ _8"></span>o<span class="_ _1a"> </span>s<span class="_ _2"></span>ay<span class="_ _6"> </span>t<span class="_ _a"></span>h<span class="_ _8"></span>e<span class="_ _7"> </span>c<span class="_ _8"></span>onn<span class="_ _8"></span>ec<span class="_ _8"></span>ted<span class="_"> </span>w<span class="_ _18"></span>ord<span class="_ _2"></span>s<span class="_ _6"> </span>w<span class="_ _8"></span>h<span class="_ _2"></span>ich<span class="_"> </span>in<span class="_ _2"></span>c<span class="_ _8"></span>l<span class="_ _a"></span>u<span class="_ _2"></span>d<span class="_ _2"></span>e<span class="_"> </span>2<span class="_ _1b"></span><span class="ff1 fs0">~<span class="ff2 fs3">8<span class="_ _6"> </span>w<span class="_ _18"></span>ords<span class="_ _d"> </span>in<span class="_"> </span>2<span 
class="_ _2"></span>0<span class="_ _7"> </span>s<span class="_ _16"></span>peech<span class="_"> </span>u<span class="_ _8"></span>tter<span class="_ _2"></span>an<span class="_ _8"></span>ces<span class="_"> </span>,<span class="_ _e"> </span>t<span class="_ _a"></span>h<span class="_ _8"></span>e<span class="_ _7"> </span>ac<span class="_ _2"></span>cu<span class="_ _2"></span>ra<span class="_ _18"></span><span class="ff5 fs0">2</span></span></span></div><div class="t m0 x9 h9 y1e ff2 fs3 fc0 sc0 ls0 ws0">cy<span class="_"> </span>can<span class="_ _7"> </span>rea<span class="_ _2"></span>ch<span class="_ _7"> </span>9<span class="_ _2"></span>5<span class="_"> </span>%<span class="_ _6"> </span>,<span class="_ _c"> </span>an<span class="_ _2"></span>d<span class="_ _7"> </span>t<span class="_ _a"></span>h<span class="_ _8"></span>e<span class="_ _3"> </span>re<span class="_ _2"></span>c<span class="_ _16"></span>og<span class="_ _2"></span>n<span class="_ _16"></span>iti<span class="_ _8"></span>on<span class="_ _7"> </span>tim<span class="_ _8"></span>e<span class="_ _7"> </span>i<span class="_ _a"></span>s<span class="_ _1a"> </span>b<span class="_ _2"></span>e<span class="_ _8"></span>tw<span class="_ _16"></span>een<span class="_"> </span>1<span class="_ _18"></span><span class="ff5 fs0">1<span class="_ _8"></span><span class="ff2 fs3">5<span class="ff1 fs0">~<span class="_ _8"></span><span class="ff2 fs3">3<span class="_ _3"> </span>s<span class="_ _2"></span>e<span class="_ _2"></span>c<span class="_ _16"></span>o<span class="_ _a"></span>n<span class="_ _2"></span>d<span class="_ _2"></span>s<span class="_ _7"> </span>in<span class="_ _7"> </span>t<span class="_ _a"></span>h<span class="_ _8"></span>i<span class="_ _a"></span>s<span class="_ _1a"> </span>s<span class="_ _8"></span>y<span class="_ _2"></span>s<span class="_ _16"></span>tem.</span></span></span></span></div><div class="t m0 x20 h5 y1f ff3 fs3 fc0 sc0 ls0 ws0">K<span class="_ 
_1c"></span>ey<span class="_ _e"> </span>w<span class="_ _16"></span>o<span class="_ _2"></span>r<span class="_ _a"></span>d<span class="_ _8"></span>s<span class="_"> </span>:<span class="_ _e"> </span><span class="ff2">s<span class="_ _16"></span>p<span class="_ _a"></span>ee<span class="_ _2"></span>ch<span class="_ _1a"> </span>rec<span class="_ _16"></span>og<span class="_ _2"></span>n<span class="_ _8"></span>iti<span class="_ _8"></span>on<span class="_ _6"> </span>;<span class="_ _17"> </span>M<span class="_ _16"></span>AT<span class="_ _1b"></span>LA<span class="_ _16"></span>B<span class="_ _6"> </span>;<span class="_ _15"> </span>C<span class="_ _18"></span>o<span class="_ _a"></span>n<span class="_ _8"></span>tinu<span class="_ _16"></span>o<span class="_ _8"></span><span class="ff1 fs0">’<span class="ff2 fs3">s<span class="_ _7"> </span>D<span class="_ _2"></span>ens<span class="_ _16"></span>ity<span class="_ _3"> </span>H<span class="_ _16"></span>i<span class="_ _a"></span>d<span class="_ _2"></span>d<span class="_ _2"></span>en<span class="_ _7"> </span>M<span class="_ _16"></span>ark<span class="_ _16"></span>ov<span class="_ _14"> </span>M<span class="_ _18"></span>o<span class="_ _a"></span>d<span class="_ _8"></span>el</span></span></span></div><div class="t m0 x21 h2 y20 ff1 fs0 fc0 sc0 ls0 ws0">图<span class="_ _14"> </span><span class="ff2 fs3">1<span class="_"> </span></span> <span class="_ _0"></span>语音输入与端点检测界面</div><div class="t m0 xe hc y21 ff3 fs9 fc0 sc0 ls0 ws0">0<span class="_"> </span><span class="ff4 fsa"> <span class="_ _0"></span>引言</span></div><div class="t m0 x22 hd y22 ff1 fsb fc0 sc0 ls0 ws0">目<span class="_ _8"></span>前<span class="_ _1a"> </span><span class="ff2 fs1">,<span class="_ _15"> </span></span>用<span class="_ _5"></span>于<span class="_ _5"></span>语<span class="_ _5"></span>音<span class="_ _5"></span>识<span class="_ _5"></span>别<span class="_ _5"></span>的<span class="_ _5"></span>方<span class="_ _5"></span>法<span 
class="_ _4"></span>有<span class="_ _5"></span>基<span class="_ _5"></span>于<span class="_ _5"></span>动<span class="_ _4"></span>态<span class="_ _5"></span>时<span class="_ _5"></span>轴<span class="_ _5"></span>归<span class="_ _4"></span>整</div><div class="t m0 x23 hb y23 ff2 fs1 fc0 sc0 ls0 ws0">(</div><div class="t m0 x24 hb y24 ff2 fs1 fc0 sc0 ls0 ws0">DT<span class="_ _18"></span>W</div><div class="t m0 x25 hb y23 ff2 fs1 fc0 sc0 ls0 ws0">)</div><div class="t m0 x17 hd y24 ff1 fsb fc0 sc0 ls0 ws0">技术的模板匹配法<span class="_ _4"></span>、<span class="_ _18"></span>基于概率统计的<span class="_ _12"> </span><span class="ff2 fs1">H<span class="_ _18"></span>M<span class="_ _18"></span>M<span class="_"> </span><span class="ff1 fsb">法和</span></span></div><div class="t m0 xe hd y25 ff1 fsb fc0 sc0 ls0 ws0">基于人工神经网络</div><div class="t m0 x26 hb y26 ff2 fs1 fc0 sc0 ls0 ws0">(</div><div class="t m0 x27 hb y25 ff2 fs1 fc0 sc0 ls0 ws0">A<span class="_ _16"></span>N<span class="_ _8"></span>N</div><div class="t m0 x28 hb y26 ff2 fs1 fc0 sc0 ls0 ws0">)</div><div class="t m0 x29 hd y25 ff1 fsb fc0 sc0 ls0 ws0">的最优搜索法<span class="_ _4"></span>。</div><div class="t m0 xe hc y27 ff3 fs9 fc0 sc0 ls0 ws0">1<span class="_"> </span><span class="ff4 fsa"> <span class="_ _0"></span>系统过程设计</span></div><div class="t m0 xe he y28 ff2 fs1 fc0 sc0 ls0 ws0">1<span class="ff5 fsb">1<span class="_ _2"></span><span class="ff2 fs1">1<span class="_"> </span><span class="ff1 fsb"> <span class="_ _0"></span>实时录音和端点检测控件</span></span></span></div><div class="t m0 x2a hf y29 ff2 fsc fc0 sc0 ls0 ws0">[<span class="_ _a"></span>1<span class="_ _4"> </span>]</div><div class="t m0 x22 hd y2a ff2 fs1 fc0 sc0 ls0 ws0">A<span class="_ _8"></span>ctiv<span class="_ _16"></span>e<span class="_ _a"></span>X<span class="_ _6"> </span><span class="ff1 fsb">控件是<span class="_ _14"> </span></span>M<span class="_ _16"></span>ic<span class="_ _a"></span>r<span class="_ _18"></span>o<span class="_ _a"></span>s<span class="_ 
_18"></span>o<span class="_ _8"></span>ft<span class="_ _1a"> </span><span class="ff1 fsb">公司制订的一种软件接口标</span></div><div class="t m0 xe hd y2b ff1 fsb fc0 sc0 ls0 ws0">准<span class="_ _7"> </span><span class="ff2 fs1">,<span class="_ _1d"> </span></span>在<span class="_ _14"> </span><span class="ff2 fs1">M<span class="_ _18"></span>AT<span class="_ _1"></span>L<span class="_ _2"></span>A<span class="_ _16"></span>B<span class="_"> </span><span class="ff1 fsb">中<span class="_ _1a"> </span></span>,<span class="_ _1d"> </span><span class="ff1 fsb">通常是将<span class="_ _7"> </span></span>A<span class="_ _2"></span>c<span class="_ _2"></span>tiv<span class="_ _8"></span>eX<span class="_ _14"> </span><span class="ff1 fsb">控<span class="_ _a"></span>件嵌<span class="_ _a"></span>入<span class="_ _a"></span>到<span class="_ _d"> </span></span>fi<span class="_ _a"></span>g<span class="_ _8"></span>ur<span class="_ _2"></span>e</span></div><div class="t m0 xe hd y2c ff1 fsb fc0 sc0 ls0 ws0">窗<span class="_ _2"></span>口中<span class="_ _7"> </span><span class="ff2 fs1">,<span class="_ _1d"> </span></span>以<span class="_ _e"> </span><span class="ff2 fs1">G<span class="_ _1b"></span>U<span class="_ _a"></span>I<span class="_"> </span><span class="ff1 fsb">程<span class="_ _a"></span>序<span class="_ _a"></span>的<span class="_ _a"></span>方<span class="_ _a"></span>式<span class="_ _a"></span>使<span class="_ _a"></span>用<span class="_ _6"></span>。<span class="_ _16"></span>通<span class="_ _a"></span>过<span class="_ _1a"> </span><span class="ff2 fs1">A<span class="_ _2"></span>c<span class="_ _2"></span>tiv<span class="_ _8"></span>e<span class="_ _a"></span>X<span class="_ _d"> </span><span class="ff1 fsb">录<span class="_ _a"></span>音<span class="_ _a"></span>控</span></span></span></span></div><div class="t m0 xe hd y2d ff1 fsb fc0 sc0 ls0 ws0">件可实现与<span class="_ _d"> </span><span class="ff2 fs1">M<span class="_ _16"></span>AT<span class="_ _1b"></span>LA<span class="_ _18"></span>B<span 
class="_ _1a"> </span><span class="ff1 fsb">主程序的双向交互<span class="_ _4"></span>。<span class="_ _18"></span>当<span class="_ _a"></span>录音控<span class="_ _a"></span>件录</span></span></div><div class="t m0 xe hd y2e ff1 fsb fc0 sc0 ls0 ws0">音完成并进行端点检测后<span class="_ _7"> </span><span class="ff2 fs1">,<span class="_ _1d"> </span></span>向主程序<span class="_ _a"></span>发送<span class="_ _a"></span>一个<span class="_ _a"></span>事件<span class="_ _7"> </span><span class="ff2 fs1">,<span class="_ _19"> </span></span>通</div><div class="t m0 xe hd y2f ff1 fsb fc0 sc0 ls0 ws0">知主程序读取语音数据及短时参数信<span class="_ _a"></span>息等<span class="_ _5"></span><span class="ff2 fs1">.<span class="_ _1e"> </span></span>端点<span class="_ _a"></span>检测<span class="_ _a"></span>算</div><div class="t m0 xe hd y30 ff1 fsb fc0 sc0 ls0 ws0">法主要采用短时平均能量和短时平均过<span class="_ _a"></span>零率<span class="_ _a"></span>作为判<span class="_ _a"></span>决的</div><div class="t m0 xe hd y31 ff1 fsb fc0 sc0 ls0 ws0">主要特征<span class="_ _4"></span>。</div><div class="t m0 x2b h10 y32 ff6 fsd fc0 sc0 ls0 ws0">e</div><div class="t m0 x13 h10 y33 ff6 fsd fc0 sc0 ls0 ws0">(</div><div class="t m0 x2c h10 y32 ff6 fsd fc0 sc0 ls0 ws0">i</div><div class="t m0 x20 h10 y33 ff6 fsd fc0 sc0 ls0 ws0">)</div><div class="t m0 x2d hd y32 ff2 fs1 fc0 sc0 ls0 ws0">=<span class="_ _1d"> </span><span class="ff1 fsb">∑</span></div><div class="t m0 x2e h11 y34 ff6 fse fc0 sc0 ls0 ws0">N</div><div class="t m0 x2f h12 y35 ff6 fse fc0 sc0 ls0 ws0">n<span class="_"> </span><span class="ff2 fsf">=<span class="_"> </span>1</span></div><div class="t m0 x30 hb y32 ff2 fs1 fc0 sc0 ls0 ws0">l<span class="_ _8"></span>og<span class="_ _6"></span><span class="ff6 fsd">x</span></div><div class="t m0 x31 hf y36 ff2 fsc fc0 sc0 ls0 ws0">2</div><div class="t m0 xf h13 y37 ff6 fs10 fc0 sc0 ls0 ws0">i</div><div class="t m0 x10 h10 y33 ff6 fsd fc0 sc0 ls0 ws0">(</div><div class="t m0 xb h10 y32 ff6 fsd fc0 sc0 ls0 ws0">n</div><div class="t m0 x32 h10 y33 ff6 fsd fc0 sc0 
ls0 ws0">)</div><div class="t m0 x33 hd y32 ff1 fsb fc0 sc0 ls0 ws0"> <span class="_ _10"></span>计算第<span class="_ _c"> </span><span class="ff6 fsd">i<span class="_ _3"> </span></span>帧的短时能量<span class="_ _4"></span><span class="ff6 fsd">;</span></div><div class="t m0 x22 hb y38 ff2 fs1 fc0 sc0 ls0 ws0">z<span class="_ _2"></span>cr</div><div class="t m0 x2c h10 y39 ff6 fsd fc0 sc0 ls0 ws0">(</div><div class="t m0 x34 h10 y38 ff6 fsd fc0 sc0 ls0 ws0">i</div><div class="t m0 x35 h10 y39 ff6 fsd fc0 sc0 ls0 ws0">)</div><div class="t m0 x36 hd y38 ff2 fs1 fc0 sc0 ls0 ws0">=<span class="_ _1f"> </span><span class="ff1 fsb">∑</span></div><div class="t m0 x37 h12 y3a ff6 fse fc0 sc0 ls0 ws0">N<span class="_"> </span><span class="ff2 fsf">-<span class="_ _7"> </span>1</span></div><div class="t m0 x37 h12 y3b ff6 fse fc0 sc0 ls0 ws0">n<span class="_"> </span><span class="ff2 fsf">=<span class="_"> </span>1</span></div><div class="t m0 x38 hb y38 ff2 fs1 fc0 sc0 ls0 ws0">|<span class="_ _1d"> </span><span class="ff6 fsd">x</span></div><div class="t m0 x39 h13 y3c ff6 fs10 fc0 sc0 ls0 ws0">i</div><div class="t m0 x3a h10 y39 ff6 fsd fc0 sc0 ls0 ws0">(</div><div class="t m0 x27 h10 y38 ff6 fsd fc0 sc0 ls0 ws0">n</div><div class="t m0 x3b h10 y39 ff6 fsd fc0 sc0 ls0 ws0">)</div><div class="t m0 x3c hb y38 ff2 fs1 fc0 sc0 ls0 ws0">-<span class="_ _1f"> </span><span class="ff6 fsd">x</span></div><div class="t m0 x3d h13 y3c ff6 fs10 fc0 sc0 ls0 ws0">i</div><div class="t m0 xd h10 y39 ff6 fsd fc0 sc0 ls0 ws0">(</div><div class="t m0 x3e hb y38 ff6 fsd fc0 sc0 ls0 ws0">n<span class="_ _3"> </span><span class="ff2 fs1">+<span class="_"> </span>1</span></div><div class="t m0 x3f h10 y39 ff6 fsd fc0 sc0 ls0 ws0">)</div><div class="t m0 x40 hd y38 ff2 fs1 fc0 sc0 ls0 ws0">|<span class="_ _9"> </span><span class="ff1 fsb"> <span class="_ _1b"></span>计<span class="_ _a"></span>算第<span class="_ _17"> </span><span class="ff6 fsd">i<span class="_ _e"> </span></span>帧<span class="_ 
_a"></span>的</span></div><div class="t m0 xe hd y3d ff1 fsb fc0 sc0 ls0 ws0">过零率</div><div class="t m0 x22 hd y3e ff1 fsb fc0 sc0 ls0 ws0">本系<span class="_ _5"></span>统<span class="_ _5"></span>采<span class="_ _a"></span>用<span class="_ _12"> </span><span class="ff2 fs1">8<span class="_ _c"> </span>k<span class="_ _a"></span>H<span class="_ _18"></span>z<span class="_ _1a"> </span><span class="ff1 fsb">采<span class="_ _5"></span>样<span class="_ _5"></span>频<span class="_ _a"></span>率<span class="_ _6"></span>、<span class="_ _18"></span><span class="ff2 fs1">16<span class="_ _17"> </span>b<span class="_ _8"></span>it<span class="_ _6"> </span><span class="ff1 fsb">、<span class="_ _16"></span>单<span class="_ _5"></span>声<span class="_ _a"></span>道<span class="_ _5"></span>的</span></span></span></span></div><div class="t m0 xe hd y3f ff2 fs1 fc0 sc0 ls0 ws0">P<span class="_ _8"></span>C<span class="_ _18"></span>M<span class="_ _d"> </span><span class="ff1 fsb">录音格式<span class="_ _1a"> </span></span>,<span class="_ _1d"> </span><span class="ff1 fsb">帧长<span class="_ _e"> </span><span class="ff6 fsd">N<span class="_ _12"> </span></span>为<span class="_ _7"> </span></span>30<span class="_ _3"> </span>m<span class="_ _2"></span>s<span class="_"> </span>,<span class="_ _15"> </span><span class="ff1 fsb">帧移<span class="_ _e"> </span><span class="ff6 fsd">M<span class="_ _3"> </span></span>为<span class="_ _7"> </span></span>10<span class="_ _3"> </span>m<span class="_ _2"></span>s<span class="_"> </span>,</div><div class="t m0 x41 h10 y40 ff6 fsd fc0 sc0 ls0 ws0">x</div><div class="t m0 x42 h10 y41 ff6 fsd fc0 sc0 ls0 ws0">(</div><div class="t m0 x43 h10 y40 ff6 fsd fc0 sc0 ls0 ws0">n</div><div class="t m0 x44 h10 y41 ff6 fsd fc0 sc0 ls0 ws0">)</div><div class="t m0 x45 hd y40 ff1 fsb fc0 sc0 ls0 ws0">为输入<span class="_ _a"></span>的<span class="_ _a"></span>语<span class="_ _a"></span>音<span class="_ _a"></span>信<span class="_ _a"></span>号<span class="_ _d"> </span><span 
class="ff6 fsd">,<span class="_ _20"> </span>x<span class="_ _12"> </span></span>为<span class="_ _a"></span>第<span class="_ _3"> </span><span class="ff6 fsd">i<span class="_ _12"> </span></span>帧<span class="_ _a"></span>的<span class="_ _5"></span>第<span class="_ _3"> </span><span class="ff6 fsd">n<span class="_ _12"> </span></span>个<span class="_ _a"></span>样<span class="_ _a"></span>本<span class="_ _6"></span>。</div><div class="t m0 x46 hd y42 ff1 fsb fc0 sc0 ls0 ws0">系统界面如图<span class="_ _14"> </span><span class="ff2 fs1">1<span class="_ _1a"> </span></span>所示<span class="_ _4"></span>。</div><div class="t m0 x46 he y43 ff2 fs1 fc0 sc0 ls0 ws0">1<span class="ff5 fsb">1<span class="_ _2"></span><span class="ff2 fs1">2<span class="_"> </span><span class="ff1 fsb"> <span class="_ _0"></span>语音信号特征参数提取</span></span></span></div><div class="t m0 x47 hf y44 ff6 fs10 fc0 sc0 ls0 ws0">[<span class="_ _a"></span><span class="ff2 fsc">1<span class="_"> </span>-<span class="_ _1a"> </span>2<span class="_ _5"></span></span>]</div><div class="t m0 x48 hd y45 ff1 fsb fc0 sc0 ls0 ws0"> <span class="_ _2"></span> <span class="_ _5"></span>语音信<span class="_ _a"></span>号<span class="_ _5"></span>特<span class="_ _a"></span>征<span class="_ _a"></span>参<span class="_ _a"></span>数<span class="_ _a"></span>的<span class="_ _5"></span>提<span class="_ _a"></span>取<span class="_ _a"></span>是<span class="_ _a"></span>语<span class="_ _a"></span>音<span class="_ _5"></span>识<span class="_ _a"></span>别<span class="_ _a"></span>的<span class="_ _a"></span>一<span class="_ _a"></span>个<span class="_ _5"></span>重<span class="_ _a"></span>要</div><div class="t m0 x46 hd y46 ff1 fsb fc0 sc0 ls0 ws0">环节<span class="_ _4"></span>。<span class="_ _18"></span>目前常用的方法是基于人的发音<span class="_ _a"></span>器官<span class="_ _a"></span>建立<span class="_ _a"></span>声道<span class="_ _a"></span>模</div><div class="t m0 x46 hd y47 ff1 fsb fc0 sc0 ls0 ws0">型和基于听觉器官建立听觉模型<span class="_ _4"></span>。<span class="_ 
_18"></span>基于<span class="_ _a"></span>听觉<span class="_ _a"></span>模型<span class="_ _a"></span>得到<span class="_ _a"></span>的</div><div class="t m0 x46 hd y48 ff2 fs1 fc0 sc0 ls0 ws0">ME<span class="_ _1"></span>L<span class="_ _c"> </span><span class="ff1 fsb">倒<span class="_ _d"> </span>谱<span class="_ _6"> </span>系<span class="_ _d"> </span>数</span></div><div class="t m0 x16 hb y49 ff2 fs1 fc0 sc0 ls0 ws0">(</div><div class="t m0 x49 hb y48 ff2 fs1 fc0 sc0 ls0 ws0">M<span class="_ _16"></span>el<span class="_ _15"> </span>-<span class="_ _1e"> </span>F<span class="_ _2"></span>r<span class="_ _2"></span>equ<span class="_ _8"></span>e<span class="_ _a"></span>n<span class="_ _8"></span>cy<span class="_ _19"> </span>C<span class="_ _16"></span>e<span class="_ _2"></span>p<span class="_ _a"></span>s<span class="_ _8"></span>t<span class="_ _a"></span>ru<span class="_ _8"></span>m<span class="_ _19"> </span>C<span class="_ _1c"></span>oe<span class="_ _16"></span>f<span class="_ _8"></span>f<span class="_ _a"></span>ic<span class="_ _2"></span>ien<span class="_ _2"></span>t<span class="_ _a"></span>s<span class="_"> </span>,</div><div class="t m0 x46 hb y4a ff2 fs1 fc0 sc0 ls0 ws0">M<span class="_ _2"></span>F<span class="_ _8"></span>C<span class="_ _8"></span>C</div><div class="t m0 x4a hb y4b ff2 fs1 fc0 sc0 ls0 ws0">)</div><div class="t m0 x4b hd y4a ff1 fsb fc0 sc0 ls0 ws0">比基于声<span class="_ _a"></span>道<span class="_ _a"></span>模<span class="_ _a"></span>型<span class="_ _a"></span>得到<span class="_ _a"></span>的<span class="_ _7"> </span><span class="ff2 fs1">L<span class="_ _a"></span>P<span class="_ _2"></span>C<span class="_"> </span><span class="ff1 fsb">倒<span class="_ _a"></span>谱<span class="_ _a"></span>系<span class="_ _a"></span>数<span class="_ _a"></span>更<span class="_ _5"></span>符<span class="_ _a"></span>合<span class="_ _a"></span>人</span></span></div><div class="t m0 x46 hd y4c ff1 fsb fc0 sc0 ls0 ws0">耳的听觉特性<span class="_ _7"> </span><span 
class="ff2 fs1">,<span class="_ _1d"> </span></span>在有信道噪声和频谱<span class="_ _a"></span>失真<span class="_ _a"></span>的情<span class="_ _a"></span>况下<span class="_ _7"> </span><span class="ff2 fs1">,<span class="_ _19"> </span></span>能</div><div class="t m0 x46 hd y4d ff1 fsb fc0 sc0 ls0 ws0">产生更高的识别精度<span class="_ _4"></span>。</div><div class="t m0 x4c hd y4e ff2 fs1 fc0 sc0 ls0 ws0">M<span class="_ _2"></span>F<span class="_ _8"></span>C<span class="_ _8"></span>C<span class="_ _d"> </span><span class="ff1 fsb">建立在<span class="_ _3"> </span></span>F<span class="_ _1c"></span>o<span class="_ _a"></span>ur<span class="_ _8"></span>ier<span class="_"> </span><span class="ff1 fsb">频<span class="_ _a"></span>谱<span class="_ _a"></span>分<span class="_ _a"></span>析基<span class="_ _a"></span>础<span class="_ _a"></span>上<span class="_ _7"> </span></span>,<span class="_ _1d"> </span><span class="ff1 fsb">首<span class="_ _a"></span>先<span class="_ _a"></span>利用<span class="_ _a"></span>人</span></div><div class="t m0 x46 hd y4f ff1 fsb fc0 sc0 ls0 ws0">耳的感知特性<span class="_ _7"> </span><span class="ff2 fs1">,<span class="_ _1d"> </span></span>在语音的频谱范围内设<span class="_ _a"></span>置若<span class="_ _a"></span>干个<span class="_ _a"></span>带通<span class="_ _a"></span>滤</div><div class="t m0 x46 hd y50 ff1 fsb fc0 sc0 ls0 ws0">波器<span class="_ _7"> </span><span class="ff2 fs1">,<span class="_ _1d"> </span></span>每个滤波器具有三角形或正弦形滤波特性<span class="_ _1a"> </span><span class="ff2 fs1">,<span class="_ _15"> </span></span>然</div></div><div class="pi" data-data='{"ctm":[1.592040,0.000000,0.000000,1.592040,0.000000,0.000000]}'></div></div>
</body>
</html>