<?xml version="1.0" encoding="UTF-8"?>
<!--
  eFRBR 1.1 record set describing one journal article:
  "Speech understanding for spoken dialogue systems: from corpus harvesting
  to grammar rule induction".

  Layout:
    efrbr:entities       one work, one expression, seven persons, one
                         corporate body and six concepts.
    efrbr:relationships  links between those entities; sourceURI / targetURI
                         repeat the "identifier" attribute of the entity
                         they point to.

  Formatting note: whitespace between elements is indentation only. Leaf
  elements whose text spans several lines keep their line breaks and leading
  spaces exactly as delivered, because whitespace inside text content is data.
-->
<efrbr:recordSet xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
                 xmlns:efrbr="http://vfrbr.info/efrbr/1.1"
                 xmlns:efrbr-work="http://vfrbr.info/efrbr/1.1/work"
                 xmlns:efrbr-expression="http://vfrbr.info/efrbr/1.1/expression"
                 xmlns:efrbr-manifestation="http://vfrbr.info/efrbr/1.1/manifestation"
                 xmlns:efrbr-person="http://vfrbr.info/efrbr/1.1/person"
                 xmlns:efrbr-corporateBody="http://vfrbr.info/efrbr/1.1/corporateBody"
                 xmlns:efrbr-concept="http://vfrbr.info/efrbr/1.1/concept"
                 xmlns:efrbr-structure="http://vfrbr.info/efrbr/1.1/structure"
                 xmlns:efrbr-responsible="http://vfrbr.info/efrbr/1.1/responsible"
                 xmlns:efrbr-subject="http://vfrbr.info/efrbr/1.1/subject"
                 xmlns:efrbr-other="http://vfrbr.info/efrbr/1.1/other"
                 xsi:schemaLocation="http://vfrbr.info/efrbr/1.1 http://vfrbr.info/schemas/1.1/efrbr.xsd">
   <efrbr:entities>
      <!-- The work and its single expression share the same identifier. -->
      <efrbr-work:work identifier="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA">
         <efrbr-work:titleOfTheWork>Speech understanding for spoken dialogue systems: from corpus harvesting to grammar rule induction</efrbr-work:titleOfTheWork>
      </efrbr-work:work>
      <efrbr-expression:expression identifier="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA">
         <efrbr-expression:titleOfTheExpression>Speech understanding for spoken dialogue systems: from corpus harvesting to grammar rule induction</efrbr-expression:titleOfTheExpression>
         <efrbr-expression:formOfExpression vocabulary="DIAS:TYPES">
            Peer-Reviewed Journal Publication
            Δημοσίευση σε Περιοδικό με Κριτές
         </efrbr-expression:formOfExpression>
         <efrbr-expression:dateOfExpression type="issued">2019-11-14</efrbr-expression:dateOfExpression>
         <efrbr-expression:dateOfExpression type="published">2018</efrbr-expression:dateOfExpression>
         <efrbr-expression:languageOfExpression vocabulary="iso639-1">en</efrbr-expression:languageOfExpression>
         <!-- The abstract contains one line break of its own; it is text content, not layout. -->
         <efrbr-expression:summarizationOfContent>We investigate algorithms and tools for the semi-automatic authoring of grammars for spoken dialogue systems (SDS) proposing a framework that spans from corpora creation to grammar induction algorithms. A realistic human-in-the-loop approach is followed balancing automation and human intervention to optimize cost to performance ratio for grammar development. Web harvesting is the main approach investigated for eliciting spoken dialogue textual data, while crowdsourcing is also proposed as an alternative method. Several techniques are presented for constructing web queries and filtering the acquired corpora. We also investigate how the harvested corpora can be used for the automatic and semi-automatic (human-in-the-loop) induction of grammar rules. SDS grammar rules and induction algorithms are grouped into two types, namely, low- and high-level. Two families of algorithms are investigated for rule induction: one based on semantic similarity and distributional semantic models, and the other using more traditional statistical modeling approaches (e.g., slot-filling algorithms using Conditional Random Fields). Evaluation results are presented for two domains and languages. High-level induction precision scores up to 60% are obtained. 
Results advocate the portability of the proposed features and algorithms across languages and domains.</efrbr-expression:summarizationOfContent>
         <efrbr-expression:useRestrictionsOnTheExpression type="creative-commons">http://creativecommons.org/licenses/by/4.0/</efrbr-expression:useRestrictionsOnTheExpression>
         <efrbr-expression:note type="journal name">Computer Speech and Language</efrbr-expression:note>
         <efrbr-expression:note type="journal volume">47</efrbr-expression:note>
         <efrbr-expression:note type="journal number">January 2018</efrbr-expression:note>
         <efrbr-expression:note type="page range">272-297</efrbr-expression:note>
      </efrbr-expression:expression>

      <!-- Persons. Names tagged vocabulary="TUC:LDAP" carry a Latin and a Greek form on separate lines. -->
      <efrbr-person:person identifier="http://users.isc.tuc.gr/~eiosif">
         <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Iosif Ilias
            Ιωσηφ Ηλιας
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>
      <efrbr-person:person identifier="http://users.isc.tuc.gr/~iklasinas">
         <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Klasinas Ioannis
            Κλασινας Ιωαννης
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>
      <efrbr-person:person identifier="http://users.isc.tuc.gr/~gathanasopoulou">
         <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Athanasopoulou Georgia
            Αθανασοπουλου Γεωργια
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>
      <efrbr-person:person identifier="http://users.isc.tuc.gr/~epalogiannidi">
         <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Palogiannidi Elisavet
            Παλογιαννιδη Ελισαβετ
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>
      <efrbr-person:person identifier="http://users.isc.tuc.gr/~sgeorgiladakis">
         <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Georgiladakis Spyridon
            Γεωργιλαδακης Σπυριδων
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>
      <!-- This person has a bare UUID identifier and an empty vocabulary attribute; both are kept as delivered. -->
      <efrbr-person:person identifier="E6C83D15-66BF-4CA9-AC02-5BC9D7BC0DBD">
         <efrbr-person:nameOfPerson vocabulary="">
            Louka Katerina
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>
      <efrbr-person:person identifier="http://users.isc.tuc.gr/~apotamianos">
         <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Potamianos Alexandros
            Ποταμιανος Αλεξανδρος
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>

      <!-- Corporate body referenced by the role="publisher" relation below. -->
      <efrbr-corporateBody:corporateBody identifier="http://www.elsevier.com/">
         <efrbr-corporateBody:nameOfTheCorporateBody vocabulary="S/R:PUBLISHERS">
            Elsevier
         </efrbr-corporateBody:nameOfTheCorporateBody>
      </efrbr-corporateBody:corporateBody>

      <!-- Subject concepts, each identified by a bare UUID. -->
      <efrbr-concept:concept identifier="67D00910-D63D-46D2-8E9C-466AC407840E">
         <efrbr-concept:termForTheConcept>
            Corpora creation
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="929A9251-40A5-43F3-BE98-C08407D9324C">
         <efrbr-concept:termForTheConcept>
            Crowdsourcing
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="380BF34F-A989-4C3F-B559-0F6C060438FC">
         <efrbr-concept:termForTheConcept>
            Grammar induction
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="3531628B-C664-45A4-A0F6-FB8841FC353B">
         <efrbr-concept:termForTheConcept>
            Semantic similarity
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="41C9F2C6-2017-4C87-9CCE-4C5274B2989F">
         <efrbr-concept:termForTheConcept>
            Spoken dialogue systems
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="1DB7FDCB-27BD-4AEF-A141-880B7A16E118">
         <efrbr-concept:termForTheConcept>
            Web mining
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
   </efrbr:entities>

   <efrbr:relationships>
      <!-- Work to expression. -->
      <efrbr-structure:structureRelations>
         <efrbr-structure:realizedThrough
               sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="expression" targetURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"/>
      </efrbr-structure:structureRelations>

      <!-- Responsibility: one createdBy on the work, then one realizedBy per author and one for the publisher. -->
      <efrbr-responsible:responsibleRelations>
         <efrbr-responsible:createdBy
               sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="person" targetURI="http://users.isc.tuc.gr/~eiosif"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="person" targetURI="http://users.isc.tuc.gr/~eiosif" role="author"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="person" targetURI="http://users.isc.tuc.gr/~iklasinas" role="author"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="person" targetURI="http://users.isc.tuc.gr/~gathanasopoulou" role="author"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="person" targetURI="http://users.isc.tuc.gr/~epalogiannidi" role="author"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="person" targetURI="http://users.isc.tuc.gr/~sgeorgiladakis" role="author"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="person" targetURI="E6C83D15-66BF-4CA9-AC02-5BC9D7BC0DBD" role="author"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="person" targetURI="http://users.isc.tuc.gr/~apotamianos" role="author"/>
         <!--
           The target URI identifies the corporateBody entity declared above
           (Elsevier); no person entity carries this identifier, so the target
           is typed as corporateBody.
           NOTE(review): confirm "corporateBody" is the token the eFRBR schema
           expects for targetEntity.
         -->
         <efrbr-responsible:realizedBy
               sourceEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="corporateBody" targetURI="http://www.elsevier.com/" role="publisher"/>
      </efrbr-responsible:responsibleRelations>

      <!-- Subject: one hasSubject per concept entity. -->
      <efrbr-subject:subjectRelations>
         <efrbr-subject:hasSubject
               sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="concept" targetURI="67D00910-D63D-46D2-8E9C-466AC407840E"/>
         <efrbr-subject:hasSubject
               sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="concept" targetURI="929A9251-40A5-43F3-BE98-C08407D9324C"/>
         <efrbr-subject:hasSubject
               sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="concept" targetURI="380BF34F-A989-4C3F-B559-0F6C060438FC"/>
         <efrbr-subject:hasSubject
               sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="concept" targetURI="3531628B-C664-45A4-A0F6-FB8841FC353B"/>
         <efrbr-subject:hasSubject
               sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="concept" targetURI="41C9F2C6-2017-4C87-9CCE-4C5274B2989F"/>
         <efrbr-subject:hasSubject
               sourceEntity="work" sourceURI="http://purl.tuc.gr/dl/dias/184E3D0D-4DCB-48FA-BD04-F7F06DFA4ACA"
               targetEntity="concept" targetURI="1DB7FDCB-27BD-4AEF-A141-880B7A16E118"/>
      </efrbr-subject:subjectRelations>

      <efrbr-other:otherRelations/>
   </efrbr:relationships>
</efrbr:recordSet>