<efrbr:recordSet xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:efrbr="http://vfrbr.info/efrbr/1.1" xmlns:efrbr-work="http://vfrbr.info/efrbr/1.1/work" xmlns:efrbr-expression="http://vfrbr.info/efrbr/1.1/expression" xmlns:efrbr-manifestation="http://vfrbr.info/efrbr/1.1/manifestation" xmlns:efrbr-person="http://vfrbr.info/efrbr/1.1/person" xmlns:efrbr-corporateBody="http://vfrbr.info/efrbr/1.1/corporateBody" xmlns:efrbr-concept="http://vfrbr.info/efrbr/1.1/concept" xmlns:efrbr-structure="http://vfrbr.info/efrbr/1.1/structure" xmlns:efrbr-responsible="http://vfrbr.info/efrbr/1.1/responsible" xmlns:efrbr-subject="http://vfrbr.info/efrbr/1.1/subject" xmlns:efrbr-other="http://vfrbr.info/efrbr/1.1/other" xsi:schemaLocation="http://vfrbr.info/efrbr/1.1 http://vfrbr.info/schemas/1.1/efrbr.xsd"><efrbr:entities><efrbr-work:work identifier="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06"><efrbr-work:titleOfTheWork>Variational denoising autoencoders and least-squares policy iteration for statistical dialogue managers</efrbr-work:titleOfTheWork></efrbr-work:work><efrbr-expression:expression identifier="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06"><efrbr-expression:titleOfTheExpression>Variational denoising autoencoders and least-squares policy iteration for statistical dialogue managers</efrbr-expression:titleOfTheExpression><efrbr-expression:formOfExpression vocabulary="DIAS:TYPES">
            Peer-Reviewed Journal Publication
            Δημοσίευση σε Περιοδικό με Κριτές
         </efrbr-expression:formOfExpression><efrbr-expression:dateOfExpression type="issued">2021-09-27</efrbr-expression:dateOfExpression><efrbr-expression:dateOfExpression type="published">2020</efrbr-expression:dateOfExpression><efrbr-expression:languageOfExpression vocabulary="iso639-1">en</efrbr-expression:languageOfExpression><efrbr-expression:summarizationOfContent>The use of Reinforcement Learning (RL) approaches for dialogue policy optimization has been the new trend for dialogue management systems. Several methods have been proposed, which are trained on dialogue data to provide optimal system response. However, most of these approaches exhibit performance degradation in the presence of noise, poor scalability to other domains, as well as performance instabilities. To overcome these problems, we propose a novel approach based on the incremental, sample-efficient Least-Squares Policy Iteration (LSPI) algorithm, which is trained on compact, fixed-size dialogue state encodings, obtained from deep Variational Denoising Autoencoders (VDAE). The proposed scheme exhibits stable and noise-robust performance, which significantly outperforms the current state-of-the-art, even in mismatched noise environments.</efrbr-expression:summarizationOfContent><efrbr-expression:useRestrictionsOnTheExpression type="creative-commons">http://creativecommons.org/licenses/by/4.0/</efrbr-expression:useRestrictionsOnTheExpression><efrbr-expression:note type="journal name">IEEE Signal Processing Letters</efrbr-expression:note><efrbr-expression:note type="journal volume">27</efrbr-expression:note><efrbr-expression:note type="page range">960–964</efrbr-expression:note></efrbr-expression:expression><efrbr-person:person identifier="http://users.isc.tuc.gr/~vdiakoloukas"><efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Diakoloukas Vasileios
            Διακολουκας Βασιλeioς
         </efrbr-person:nameOfPerson></efrbr-person:person><efrbr-person:person identifier="http://users.isc.tuc.gr/~flygerakis"><efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Lygerakis Fotios
            Λυγερακης Φωτιος
         </efrbr-person:nameOfPerson></efrbr-person:person><efrbr-person:person identifier="http://users.isc.tuc.gr/~lagoudakis"><efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Lagoudakis Michail
            Λαγουδακης Μιχαηλ
         </efrbr-person:nameOfPerson></efrbr-person:person><efrbr-person:person identifier="D98DBC60-3A88-49C5-8EBD-1E828485AEF2"><efrbr-person:nameOfPerson vocabulary="">
            Kotti Margarita
         </efrbr-person:nameOfPerson></efrbr-person:person><efrbr-corporateBody:corporateBody identifier="https://v2.sherpa.ac.uk/id/publisher/38"><efrbr-corporateBody:nameOfTheCorporateBody vocabulary="S/R:PUBLISHERS">
            Institute of Electrical and Electronics Engineers
         </efrbr-corporateBody:nameOfTheCorporateBody></efrbr-corporateBody:corporateBody><efrbr-concept:concept identifier="AA23DA51-61FB-4929-8F9A-FFB5DB4E4EAF"><efrbr-concept:termForTheConcept>
            Variational autoencoders
         </efrbr-concept:termForTheConcept></efrbr-concept:concept><efrbr-concept:concept identifier="6532B77F-9434-416B-9744-6053BFC56196"><efrbr-concept:termForTheConcept>
            Denoising
         </efrbr-concept:termForTheConcept></efrbr-concept:concept><efrbr-concept:concept identifier="78F960B7-DA9E-4294-A427-FCE72CA3E41A"><efrbr-concept:termForTheConcept>
            Dialogue systems
         </efrbr-concept:termForTheConcept></efrbr-concept:concept><efrbr-concept:concept identifier="01D3D7C1-1D0A-4BC5-9DD7-B0109D33E338"><efrbr-concept:termForTheConcept>
            Sample-efficient statistical dialogue managers
         </efrbr-concept:termForTheConcept></efrbr-concept:concept><efrbr-concept:concept identifier="44F084E7-F823-4AEC-9589-6B2EE0B131DC"><efrbr-concept:termForTheConcept>
            Least-squares policy iteration
         </efrbr-concept:termForTheConcept></efrbr-concept:concept></efrbr:entities><efrbr:relationships><efrbr-structure:structureRelations><efrbr-structure:realizedThrough sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="expression" targetURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06"/></efrbr-structure:structureRelations><efrbr-responsible:responsibleRelations><efrbr-responsible:createdBy sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="person" targetURI="http://users.isc.tuc.gr/~vdiakoloukas"/><efrbr-responsible:realizedBy sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="person" targetURI="http://users.isc.tuc.gr/~vdiakoloukas" role="author"/><efrbr-responsible:realizedBy sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="person" targetURI="http://users.isc.tuc.gr/~flygerakis" role="author"/><efrbr-responsible:realizedBy sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="person" targetURI="http://users.isc.tuc.gr/~lagoudakis" role="author"/><efrbr-responsible:realizedBy sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="person" targetURI="D98DBC60-3A88-49C5-8EBD-1E828485AEF2" role="author"/><efrbr-responsible:realizedBy sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="person" targetURI="https://v2.sherpa.ac.uk/id/publisher/38" role="publisher"/></efrbr-responsible:responsibleRelations><efrbr-subject:subjectRelations><efrbr-subject:hasSubject sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="concept" targetURI="AA23DA51-61FB-4929-8F9A-FFB5DB4E4EAF"/><efrbr-subject:hasSubject sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="concept" targetURI="6532B77F-9434-416B-9744-6053BFC56196"/><efrbr-subject:hasSubject sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="concept" targetURI="78F960B7-DA9E-4294-A427-FCE72CA3E41A"/><efrbr-subject:hasSubject sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="concept" targetURI="01D3D7C1-1D0A-4BC5-9DD7-B0109D33E338"/><efrbr-subject:hasSubject sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/A1FB74B4-8B64-46FA-B0AE-941918F57F06" targetEntity="concept" targetURI="44F084E7-F823-4AEC-9589-6B2EE0B131DC"/></efrbr-subject:subjectRelations><efrbr-other:otherRelations/></efrbr:relationships></efrbr:recordSet>