<?xml version="1.0" encoding="UTF-8" ?>
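<oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">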
<dc:title>Modeling, estimating, and compensating low-bit rate coding distortion in speech recognition</dc:title>
<dc:creator>Becerra-Yoma, Nestor</dc:creator>
<dc:creator>Silva-Sánchez, Jorge</dc:creator>
<dc:creator>Busso-Vyhmeister, Carlos</dc:creator>
<dc:creator>Busso-Vyhmeister, Carlos</dc:creator>
<dc:description>A solution to the problem of speech recognition with signals distorted by low-bit rate coders is presented in this paper. A model for the coding-decoding distortion, a HMM compensation method to include this model, and an EM-based adaptation algorithm to estimate this distortion are proposed here. Medium vocabulary continuous-speech speaker-independent recognition experiments with 8 kbps G.729(CS-CELP), 13 kbps RPE-LTP (GSM), 5.3 kbps G723.1, 4.8 kbps FS-1016 and 32 kbps G.726(ADPCM) coders show that the approach described in this paper is able to dramatically reduce the effect of the coding distortion and, in some cases, gives a word accuracy higher than the baseline system with uncoded speech. Finally, the EM estimation algorithm requires only one adapting utterance and the approach described is certainly suitable for dialogue systems where just a few adapting utterances are available.</dc:description>
<dc:date>2006</dc:date>
<dc:type>info:eu-repo/semantics/article</dc:type>
<dc:type>info:eu-repo/semantics/publishedVersion</dc:type>
<dc:identifier>http://hdl.handle.net/10533/197802</dc:identifier>
<dc:identifier>doi: 10.1109/TSA.2005.852994</dc:identifier>
<dc:identifier>wos: WOS:000235369100024</dc:identifier>
<dc:identifier>issn: 1063-6676</dc:identifier>
<dc:language>eng</dc:language>
<dc:relation>instname: Conicyt</dc:relation>
<dc:relation>reponame: Repositorio Digital RI2.0</dc:relation>
<dc:relation>instname: Conicyt</dc:relation>
<dc:relation>reponame: Repositorio Digital RI2.0</dc:relation>
<dc:relation>info:eu-repo/grantAgreement/Fondef/D02I1089</dc:relation>
<dc:relation>info:eu-repo/semantics/dataset/hdl.handle.net/10533/93477</dc:relation>
<dc:rights>info:eu-repo/semantics/openAccess</dc:rights>
<dc:source>IEEE TRANSACTIONS ON SPEECH AND AUDIO PROCESSING</dc:source>
<dc:source>reponame:Artículos CONICYT</dc:source>
<dc:source>instname:CONICYT Chile</dc:source>
<dc:source>instacron:CONICYT</dc:source>
<about>
<provenance>
<originDescription altered="" harvestDate="">
<datestamp>2020-01-27T14:04:19Z</datestamp>
<metadataNamespace>http://www.openarchives.org/OAI/2.0/oai_dc/</metadataNamespace>
<repositoryName>Artículos CONICYT - CONICYT Chile</repositoryName>
</originDescription>
</provenance>
</about>
</oai_dc:dc>
<?xml version="1.0" encoding="UTF-8" ?>
<metadata schemaLocation="http://www.lyncode.com/xoai http://www.lyncode.com/xsd/xoai.xsd">
<element name="dc">
<element name="title">
<element name="none">
<field name="value">Modeling, estimating, and compensating low-bit rate coding distortion in speech recognition</field>
</element>
</element>
<element name="creator">
<element name="none">
<field name="value">Becerra-Yoma, Nestor</field>
<field name="value">Silva-Sánchez, Jorge</field>
<field name="value">Busso-Vyhmeister, Carlos</field>
<field name="value">Busso-Vyhmeister, Carlos</field>
</element>
</element>
<element name="description">
<element name="none">
<field name="value">A solution to the problem of speech recognition with signals distorted by low-bit rate coders is presented in this paper. A model for the coding-decoding distortion, a HMM compensation method to include this model, and an EM-based adaptation algorithm to estimate this distortion are proposed here. Medium vocabulary continuous-speech speaker-independent recognition experiments with 8 kbps G.729(CS-CELP), 13 kbps RPE-LTP (GSM), 5.3 kbps G723.1, 4.8 kbps FS-1016 and 32 kbps G.726(ADPCM) coders show that the approach described in this paper is able to dramatically reduce the effect of the coding distortion and, in some cases, gives a word accuracy higher than the baseline system with uncoded speech. Finally, the EM estimation algorithm requires only one adapting utterance and the approach described is certainly suitable for dialogue systems where just a few adapting utterances are available.</field>
</element>
</element>
<element name="date">
<element name="none">
<field name="value">2006</field>
</element>
</element>
<element name="type">
<element name="none">
<field name="value">info:eu-repo/semantics/article</field>
<field name="value">info:eu-repo/semantics/publishedVersion</field>
</element>
</element>
<element name="identifier">
<element name="none">
<field name="value">http://hdl.handle.net/10533/197802</field>
<field name="value">doi: 10.1109/TSA.2005.852994</field>
<field name="value">wos: WOS:000235369100024</field>
<field name="value">issn: 1063-6676</field>
</element>
</element>
<element name="source">
<element name="none">
<field name="value">IEEE TRANSACTIONS ON SPEECH AND AUDIO PROCESSING</field>
<field name="value">reponame:Artículos CONICYT</field>
<field name="value">instname:CONICYT Chile</field>
<field name="value">instacron:CONICYT</field>
</element>
</element>
<element name="relation">
<element name="none">
<field name="value">instname: Conicyt</field>
<field name="value">reponame: Repositorio Digital RI2.0</field>
<field name="value">instname: Conicyt</field>
<field name="value">reponame: Repositorio Digital RI2.0</field>
<field name="value">info:eu-repo/grantAgreement/Fondef/D02I1089</field>
<field name="value">info:eu-repo/semantics/dataset/hdl.handle.net/10533/93477</field>
</element>
</element>
<element name="rights">
<element name="none">
<field name="value">info:eu-repo/semantics/openAccess</field>
</element>
</element>
<element name="language">
<element name="none">
<field name="value">eng</field>
</element>
</element>
</element>
<element name="others">
<field name="lastModifyDate">2020-01-27T14:04:19Z</field>
</element>
</metadata>