<?xml version="1.0" encoding="UTF-8"?>
<!--
  eFRBR 1.1 record set describing one conference paper.

  Entities:      1 work, 1 expression, 5 persons, 1 corporate body, 2 concepts.
  Relationships: structure (work to expression), responsibility (creator,
                 authors, publisher) and subject (work to concepts).

  Formatting note: only element-only content is indented. The character
  content of text-bearing elements (titles, names, terms, abstract) is kept
  exactly as delivered, including its internal line breaks and leading spaces,
  because that whitespace is part of the data handed to consumers.
-->
<efrbr:recordSet xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
                 xmlns:efrbr="http://vfrbr.info/efrbr/1.1"
                 xmlns:efrbr-work="http://vfrbr.info/efrbr/1.1/work"
                 xmlns:efrbr-expression="http://vfrbr.info/efrbr/1.1/expression"
                 xmlns:efrbr-manifestation="http://vfrbr.info/efrbr/1.1/manifestation"
                 xmlns:efrbr-person="http://vfrbr.info/efrbr/1.1/person"
                 xmlns:efrbr-corporateBody="http://vfrbr.info/efrbr/1.1/corporateBody"
                 xmlns:efrbr-concept="http://vfrbr.info/efrbr/1.1/concept"
                 xmlns:efrbr-structure="http://vfrbr.info/efrbr/1.1/structure"
                 xmlns:efrbr-responsible="http://vfrbr.info/efrbr/1.1/responsible"
                 xmlns:efrbr-subject="http://vfrbr.info/efrbr/1.1/subject"
                 xmlns:efrbr-other="http://vfrbr.info/efrbr/1.1/other"
                 xsi:schemaLocation="http://vfrbr.info/efrbr/1.1 http://vfrbr.info/schemas/1.1/efrbr.xsd">
  <efrbr:entities>

    <!-- The work and its expression carry the same identifier URI. -->
    <efrbr-work:work identifier="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0">
      <efrbr-work:titleOfTheWork>Hybrid in-database inference for declarative information extraction</efrbr-work:titleOfTheWork>
    </efrbr-work:work>

    <efrbr-expression:expression identifier="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0">
      <efrbr-expression:titleOfTheExpression>Hybrid in-database inference for declarative information extraction</efrbr-expression:titleOfTheExpression>
      <!-- Form label is given twice in one value: Greek, then English. -->
      <efrbr-expression:formOfExpression vocabulary="DIAS:TYPES">
            Πλήρης Δημοσίευση σε Συνέδριο
            Conference Full Paper
         </efrbr-expression:formOfExpression>
      <efrbr-expression:dateOfExpression type="issued">2015-11-30</efrbr-expression:dateOfExpression>
      <efrbr-expression:dateOfExpression type="published">2011</efrbr-expression:dateOfExpression>
      <efrbr-expression:languageOfExpression vocabulary="iso639-1">en</efrbr-expression:languageOfExpression>
      <!-- Abstract; hard line breaks are part of the stored text. -->
      <efrbr-expression:summarizationOfContent>In the database community, work on information extraction (IE)
has centered on two themes: how to effectively manage IE tasks,
and how to manage the uncertainties that arise in the IE process
in a scalable manner. Recent work has proposed a probabilistic
database (PDB) based declarative IE system that supports a leading
statistical IE model, and an associated inference algorithm to
answer top-k-style queries over the probabilistic IE outcome. Still,
the broader problem of effectively supporting general probabilistic
inference inside a PDB-based declarative IE system remains
open. In this paper, we explore the in-database implementations of
a wide variety of inference algorithms suited to IE, including two
Markov chain Monte Carlo algorithms, Viterbi and sum-product algorithms.
We describe the rules for choosing appropriate inference
algorithms based on the model, the query and the text, considering
the trade-off between accuracy and runtime. Based on these rules,
we describe a hybrid approach to optimize the execution of a single
probabilistic IE query to employ different inference algorithms
appropriate for different records. We show that our techniques can
achieve up to 10-fold speedups compared to the non-hybrid solutions
proposed in the literature.</efrbr-expression:summarizationOfContent>
      <efrbr-expression:useRestrictionsOnTheExpression type="creative-commons">http://creativecommons.org/licenses/by/4.0/</efrbr-expression:useRestrictionsOnTheExpression>
      <efrbr-expression:note type="page range">517-528 </efrbr-expression:note>
      <efrbr-expression:note type="conference name">ACM SIGMOD International Conference on Management of Data</efrbr-expression:note>
      <efrbr-expression:note type="proceedings title">Proceedings of the 2011 ACM SIGMOD International Conference on Management of Data</efrbr-expression:note>
    </efrbr-expression:expression>

    <!-- Persons. Identifiers are either bare UUIDs or URIs, as delivered. -->
    <efrbr-person:person identifier="2DFFBC66-47EB-49CC-B1E7-935BFCF86319">
      <efrbr-person:nameOfPerson vocabulary="">
            Wang Daisy Zhe
         </efrbr-person:nameOfPerson>
    </efrbr-person:person>
    <efrbr-person:person identifier="A12ED487-3A0E-43EE-834D-57088E07BA9A">
      <efrbr-person:nameOfPerson vocabulary="">
            Franklin Michael J.
         </efrbr-person:nameOfPerson>
    </efrbr-person:person>
    <efrbr-person:person identifier="http://users.isc.tuc.gr/~mgarofalakis">
      <efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Garofalakis Minos
            Γαροφαλακης Μινως
         </efrbr-person:nameOfPerson>
    </efrbr-person:person>
    <efrbr-person:person identifier="http://viaf.org/viaf/31030036">
      <efrbr-person:nameOfPerson vocabulary="VIAF">
            Hellerstein, Joseph, 1952-
         </efrbr-person:nameOfPerson>
    </efrbr-person:person>
    <efrbr-person:person identifier="90F58A11-7696-4B38-928E-8E2AE388B8CB">
      <efrbr-person:nameOfPerson vocabulary="">
            Wick Michael L.
         </efrbr-person:nameOfPerson>
    </efrbr-person:person>

    <!-- Corporate body referenced by the publisher relation below. -->
    <efrbr-corporateBody:corporateBody identifier="http://www.acm.org/">
      <efrbr-corporateBody:nameOfTheCorporateBody vocabulary="S/R:PUBLISHERS">
            Association for Computing Machinery
         </efrbr-corporateBody:nameOfTheCorporateBody>
    </efrbr-corporateBody:corporateBody>

    <!-- Subject concepts referenced by the hasSubject relations below. -->
    <efrbr-concept:concept identifier="2C1F806D-555D-4C15-92EF-DD579B0529F5">
      <efrbr-concept:termForTheConcept>
            Database management
         </efrbr-concept:termForTheConcept>
    </efrbr-concept:concept>
    <efrbr-concept:concept identifier="DBCD4F91-FCD7-48A6-A6D6-EADAE6FECAD5">
      <efrbr-concept:termForTheConcept>
            Mathematics of computing
         </efrbr-concept:termForTheConcept>
    </efrbr-concept:concept>

  </efrbr:entities>

  <!--
    Each relation links two entities declared above: sourceURI / targetURI
    repeat an entity's identifier attribute, and sourceEntity / targetEntity
    name the kind of entity that identifier belongs to.
  -->
  <efrbr:relationships>

    <efrbr-structure:structureRelations>
      <efrbr-structure:realizedThrough
          sourceEntity="work"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="expression"
          targetURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"/>
    </efrbr-structure:structureRelations>

    <efrbr-responsible:responsibleRelations>
      <efrbr-responsible:createdBy
          sourceEntity="work"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="person"
          targetURI="2DFFBC66-47EB-49CC-B1E7-935BFCF86319"/>

      <!-- Authors of the expression, one relation per person entity. -->
      <efrbr-responsible:realizedBy
          sourceEntity="expression"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="person"
          targetURI="2DFFBC66-47EB-49CC-B1E7-935BFCF86319"
          role="author"/>
      <efrbr-responsible:realizedBy
          sourceEntity="expression"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="person"
          targetURI="A12ED487-3A0E-43EE-834D-57088E07BA9A"
          role="author"/>
      <efrbr-responsible:realizedBy
          sourceEntity="expression"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="person"
          targetURI="http://users.isc.tuc.gr/~mgarofalakis"
          role="author"/>
      <efrbr-responsible:realizedBy
          sourceEntity="expression"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="person"
          targetURI="http://viaf.org/viaf/31030036"
          role="author"/>
      <efrbr-responsible:realizedBy
          sourceEntity="expression"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="person"
          targetURI="90F58A11-7696-4B38-928E-8E2AE388B8CB"
          role="author"/>

      <!--
        Publisher. The target URI is the identifier of the corporateBody
        entity declared above (no person entity carries it), so targetEntity
        names that entity kind rather than "person".
      -->
      <efrbr-responsible:realizedBy
          sourceEntity="expression"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="corporateBody"
          targetURI="http://www.acm.org/"
          role="publisher"/>
    </efrbr-responsible:responsibleRelations>

    <efrbr-subject:subjectRelations>
      <efrbr-subject:hasSubject
          sourceEntity="work"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="concept"
          targetURI="2C1F806D-555D-4C15-92EF-DD579B0529F5"/>
      <efrbr-subject:hasSubject
          sourceEntity="work"
          sourceURI="http://purl.tuc.gr/dl/dias/9FBD290C-DC9B-419A-9A80-E532CB9521E0"
          targetEntity="concept"
          targetURI="DBCD4F91-FCD7-48A6-A6D6-EADAE6FECAD5"/>
    </efrbr-subject:subjectRelations>

    <efrbr-other:otherRelations/>

  </efrbr:relationships>
</efrbr:recordSet>