<?xml version="1.0" encoding="UTF-8"?>
<!--
   eFRBR 1.1 record set for the journal article
   "Query analytics over probabilistic databases with unmerged duplicates".

   Layout:
     entities       one work, one expression, two persons, one corporate body
                    and six concepts, each carrying an "identifier" attribute
     relationships  links between those entities; sourceURI / targetURI repeat
                    the identifier values of the entities being linked

   Whitespace inside text-bearing elements (formOfExpression, nameOfPerson,
   nameOfTheCorporateBody, termForTheConcept, summarizationOfContent) is part
   of their content and is kept exactly as in the source record. Do not
   re-indent those lines.
-->
<efrbr:recordSet xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
                 xmlns:efrbr="http://vfrbr.info/efrbr/1.1"
                 xmlns:efrbr-work="http://vfrbr.info/efrbr/1.1/work"
                 xmlns:efrbr-expression="http://vfrbr.info/efrbr/1.1/expression"
                 xmlns:efrbr-manifestation="http://vfrbr.info/efrbr/1.1/manifestation"
                 xmlns:efrbr-person="http://vfrbr.info/efrbr/1.1/person"
                 xmlns:efrbr-corporateBody="http://vfrbr.info/efrbr/1.1/corporateBody"
                 xmlns:efrbr-concept="http://vfrbr.info/efrbr/1.1/concept"
                 xmlns:efrbr-structure="http://vfrbr.info/efrbr/1.1/structure"
                 xmlns:efrbr-responsible="http://vfrbr.info/efrbr/1.1/responsible"
                 xmlns:efrbr-subject="http://vfrbr.info/efrbr/1.1/subject"
                 xmlns:efrbr-other="http://vfrbr.info/efrbr/1.1/other"
                 xsi:schemaLocation="http://vfrbr.info/efrbr/1.1 http://vfrbr.info/schemas/1.1/efrbr.xsd">
   <efrbr:entities>
      <!-- Work and expression share the same identifier URI. -->
      <efrbr-work:work identifier="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9">
         <efrbr-work:titleOfTheWork>Query analytics over probabilistic databases with unmerged duplicates</efrbr-work:titleOfTheWork>
      </efrbr-work:work>
      <efrbr-expression:expression identifier="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9">
         <efrbr-expression:titleOfTheExpression>Query analytics over probabilistic databases with unmerged duplicates</efrbr-expression:titleOfTheExpression>
         <efrbr-expression:formOfExpression vocabulary="DIAS:TYPES">
            Peer-Reviewed Journal Publication
            Δημοσίευση σε Περιοδικό με Κριτές
         </efrbr-expression:formOfExpression>
         <efrbr-expression:dateOfExpression type="issued">2015-10-29</efrbr-expression:dateOfExpression>
         <efrbr-expression:dateOfExpression type="published">2015</efrbr-expression:dateOfExpression>
         <efrbr-expression:languageOfExpression vocabulary="iso639-1">en</efrbr-expression:languageOfExpression>
         <!-- Abstract text, including its embedded line break, is reproduced verbatim. -->
         <efrbr-expression:summarizationOfContent>Recent entity resolution approaches exhibit benefits when addressing the problem through unmerged duplicates: instances describing real-world objects are not merged based on apriori thresholds or human intervention, instead relevant resolution information is employed for evaluating resolution decisions during query processing using “possible worlds” semantics. In this paper, we present the first known approach for efficiently handling complex analytical queries over probabilistic databases with unmerged duplicates. We propose the ENTITY-JOIN operator that allows expressing complex aggregation and iceberg/top-k queries over joins between tables with unmerged duplicates and other database tables. Our technical content includes a novel indexing structure for efficient access to the entity resolution information and novel techniques for the efficient evaluation of complex probabilistic queries that retrieve analytical and summarized information over a (potentially, huge) collection of possible resolution worlds. 
Our extensive experimental evaluation verifies the benefits of our approach.</efrbr-expression:summarizationOfContent>
         <efrbr-expression:useRestrictionsOnTheExpression type="creative-commons">http://creativecommons.org/licenses/by/4.0/</efrbr-expression:useRestrictionsOnTheExpression>
         <efrbr-expression:note type="journal name">IEEE Transactions on Knowledge and Data Engineering</efrbr-expression:note>
         <efrbr-expression:note type="journal volume">27</efrbr-expression:note>
         <efrbr-expression:note type="journal number">8</efrbr-expression:note>
         <efrbr-expression:note type="page range">2245-2260</efrbr-expression:note>
      </efrbr-expression:expression>

      <!-- Persons referenced by the createdBy / realizedBy (author) relations below. -->
      <efrbr-person:person identifier="http://users.isc.tuc.gr/~aioannou">
         <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Ioannou Aikaterini
            Ιωαννου Αικατερινη
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>
      <efrbr-person:person identifier="http://users.isc.tuc.gr/~mgarofalakis">
         <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Garofalakis Minos
            Γαροφαλακης Μινως
         </efrbr-person:nameOfPerson>
      </efrbr-person:person>

      <!-- Corporate body referenced by the realizedBy (publisher) relation below. -->
      <efrbr-corporateBody:corporateBody identifier="http://www.ieee.org/index.html">
         <efrbr-corporateBody:nameOfTheCorporateBody vocabulary="S/R:PUBLISHERS">
            Institute of Electrical and Electronics Engineers
         </efrbr-corporateBody:nameOfTheCorporateBody>
      </efrbr-corporateBody:corporateBody>

      <!-- Subject concepts; each identifier is the targetURI of one hasSubject relation. -->
      <efrbr-concept:concept identifier="F2F91A75-B3E1-4B4D-AD19-A99AE158E4EF">
         <efrbr-concept:termForTheConcept>
            Couplings
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="CBCDBF74-4EA7-4825-B02E-7E708A04C494">
         <efrbr-concept:termForTheConcept>
            Probabilistic logic
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="A1E1344D-1346-4169-B40E-2B9D90F172A9">
         <efrbr-concept:termForTheConcept>
            Semantics
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="0EFF2C2F-D00C-4381-835B-1872049BC4EB">
         <efrbr-concept:termForTheConcept>
            Indexing
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="05082A00-0076-4ADE-A6D8-03922592DE78">
         <efrbr-concept:termForTheConcept>
            Data models
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
      <efrbr-concept:concept identifier="D5632DFA-70B6-4BD6-8ABE-0C68C9F63585">
         <efrbr-concept:termForTheConcept>
            Aggregates
         </efrbr-concept:termForTheConcept>
      </efrbr-concept:concept>
   </efrbr:entities>

   <efrbr:relationships>
      <!-- Work to expression. -->
      <efrbr-structure:structureRelations>
         <efrbr-structure:realizedThrough
               sourceEntity="work"
               targetEntity="expression"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"/>
      </efrbr-structure:structureRelations>

      <!-- Responsibility: creator of the work, authors and publisher of the expression. -->
      <efrbr-responsible:responsibleRelations>
         <!-- NOTE(review): only ~aioannou is linked via createdBy, while both persons
              are realizedBy authors below. Confirm whether this is intentional. -->
         <efrbr-responsible:createdBy
               sourceEntity="work"
               targetEntity="person"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="http://users.isc.tuc.gr/~aioannou"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression"
               role="author"
               targetEntity="person"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="http://users.isc.tuc.gr/~aioannou"/>
         <efrbr-responsible:realizedBy
               sourceEntity="expression"
               role="author"
               targetEntity="person"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="http://users.isc.tuc.gr/~mgarofalakis"/>
         <!-- The publisher targetURI is the identifier of the corporateBody entity
              declared under entities, so the target entity type is corporateBody. -->
         <efrbr-responsible:realizedBy
               sourceEntity="expression"
               role="publisher"
               targetEntity="corporateBody"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="http://www.ieee.org/index.html"/>
      </efrbr-responsible:responsibleRelations>

      <!-- Subjects: one hasSubject relation per concept entity, in declaration order. -->
      <efrbr-subject:subjectRelations>
         <efrbr-subject:hasSubject
               sourceEntity="work"
               targetEntity="concept"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="F2F91A75-B3E1-4B4D-AD19-A99AE158E4EF"/>
         <efrbr-subject:hasSubject
               sourceEntity="work"
               targetEntity="concept"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="CBCDBF74-4EA7-4825-B02E-7E708A04C494"/>
         <efrbr-subject:hasSubject
               sourceEntity="work"
               targetEntity="concept"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="A1E1344D-1346-4169-B40E-2B9D90F172A9"/>
         <efrbr-subject:hasSubject
               sourceEntity="work"
               targetEntity="concept"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="0EFF2C2F-D00C-4381-835B-1872049BC4EB"/>
         <efrbr-subject:hasSubject
               sourceEntity="work"
               targetEntity="concept"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="05082A00-0076-4ADE-A6D8-03922592DE78"/>
         <efrbr-subject:hasSubject
               sourceEntity="work"
               targetEntity="concept"
               sourceURI="http://purl.tuc.gr/dl/dias/D4893A56-E33D-4BDB-8414-A93DDC1A06E9"
               targetURI="D5632DFA-70B6-4BD6-8ABE-0C68C9F63585"/>
      </efrbr-subject:subjectRelations>

      <efrbr-other:otherRelations/>
   </efrbr:relationships>
</efrbr:recordSet>