<efrbr:recordSet xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:efrbr="http://vfrbr.info/efrbr/1.1" xmlns:efrbr-work="http://vfrbr.info/efrbr/1.1/work" xmlns:efrbr-expression="http://vfrbr.info/efrbr/1.1/expression" xmlns:efrbr-manifestation="http://vfrbr.info/efrbr/1.1/manifestation" xmlns:efrbr-person="http://vfrbr.info/efrbr/1.1/person" xmlns:efrbr-corporateBody="http://vfrbr.info/efrbr/1.1/corporateBody" xmlns:efrbr-concept="http://vfrbr.info/efrbr/1.1/concept" xmlns:efrbr-structure="http://vfrbr.info/efrbr/1.1/structure" xmlns:efrbr-responsible="http://vfrbr.info/efrbr/1.1/responsible" xmlns:efrbr-subject="http://vfrbr.info/efrbr/1.1/subject" xmlns:efrbr-other="http://vfrbr.info/efrbr/1.1/other" xsi:schemaLocation="http://vfrbr.info/efrbr/1.1 http://vfrbr.info/schemas/1.1/efrbr.xsd"><efrbr:entities><efrbr-work:work identifier="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E"><efrbr-work:titleOfTheWork>Maximum-likelihood stochastic-transformation adaptation of hidden Markov models</efrbr-work:titleOfTheWork></efrbr-work:work><efrbr-expression:expression identifier="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E"><efrbr-expression:titleOfTheExpression>Maximum-likelihood stochastic-transformation adaptation of hidden Markov models</efrbr-expression:titleOfTheExpression><efrbr-expression:formOfExpression vocabulary="DIAS:TYPES">
            Peer-Reviewed Journal Publication
            Δημοσίευση σε Περιοδικό με Κριτές
         </efrbr-expression:formOfExpression><efrbr-expression:dateOfExpression type="issued">2015-11-02</efrbr-expression:dateOfExpression><efrbr-expression:dateOfExpression type="published">1999</efrbr-expression:dateOfExpression><efrbr-expression:languageOfExpression vocabulary="iso639-1">en</efrbr-expression:languageOfExpression><efrbr-expression:summarizationOfContent>The recognition accuracy in previous large vocabulary automatic speech recognition (ASR) systems is highly related to the existing mismatch between the training and testing sets. For example, dialect differences across the training and testing speakers result in a significant degradation in recognition performance. Some popular adaptation approaches improve the recognition performance of speech recognizers based on hidden Markov models with continuous mixture densities by using linear transformations to adapt the means, and possibly the covariances of the mixture Gaussians. The linear assumption, however, is too restrictive, and in this paper we propose a novel adaptation technique that adapts the means and, optionally, the covariances of the mixture Gaussians by using multiple stochastic transformations. We perform both speaker and dialect adaptation experiments, and we show that our method significantly improves the recognition accuracy and the robustness of our system. The experiments are carried out with SRI's DECIPHER speech recognition system</efrbr-expression:summarizationOfContent><efrbr-expression:useRestrictionsOnTheExpression type="creative-commons">http://creativecommons.org/licenses/by/4.0/</efrbr-expression:useRestrictionsOnTheExpression><efrbr-expression:note type="journal name">IEEE Transactions Speech and Audio Processing</efrbr-expression:note><efrbr-expression:note type="journal volume">7</efrbr-expression:note><efrbr-expression:note type="journal number">2</efrbr-expression:note><efrbr-expression:note type="page range">177-187</efrbr-expression:note></efrbr-expression:expression><efrbr-person:person identifier="http://users.isc.tuc.gr/~vdiakoloukas"><efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Diakoloukas Vasilis
            Διακολουκας Βασιλeioς
         </efrbr-person:nameOfPerson></efrbr-person:person><efrbr-person:person identifier="http://users.isc.tuc.gr/~vdigalakis"><efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Digalakis Vasilis
            Διγαλακης Βασιλης
         </efrbr-person:nameOfPerson></efrbr-person:person><efrbr-corporateBody:corporateBody identifier="http://www.ieee.org/index.html"><efrbr-corporateBody:nameOfTheCorporateBody vocabulary="S/R:PUBLISHERS">
            Institute of Electrical and Electronics Engineers
         </efrbr-corporateBody:nameOfTheCorporateBody></efrbr-corporateBody:corporateBody><efrbr-concept:concept identifier="1D11FC1F-88FB-4118-BF33-E04E087DC583"><efrbr-concept:termForTheConcept>
            Speech recognition
         </efrbr-concept:termForTheConcept></efrbr-concept:concept></efrbr:entities><efrbr:relationships><efrbr-structure:structureRelations><efrbr-structure:realizedThrough sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E" targetEntity="expression" targetURI="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E"/></efrbr-structure:structureRelations><efrbr-responsible:responsibleRelations><efrbr-responsible:createdBy sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E" targetEntity="person" targetURI="http://users.isc.tuc.gr/~vdiakoloukas"/><efrbr-responsible:realizedBy sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E" targetEntity="person" targetURI="http://users.isc.tuc.gr/~vdiakoloukas" role="author"/><efrbr-responsible:realizedBy sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E" targetEntity="person" targetURI="http://users.isc.tuc.gr/~vdigalakis" role="author"/><efrbr-responsible:realizedBy sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E" targetEntity="person" targetURI="http://www.ieee.org/index.html" role="publisher"/></efrbr-responsible:responsibleRelations><efrbr-subject:subjectRelations><efrbr-subject:hasSubject sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/04E5D722-6179-44E9-A174-4A2CA13F096E" targetEntity="concept" targetURI="1D11FC1F-88FB-4118-BF33-E04E087DC583"/></efrbr-subject:subjectRelations><efrbr-other:otherRelations/></efrbr:relationships></efrbr:recordSet>