<efrbr:recordSet xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:efrbr="http://vfrbr.info/efrbr/1.1" xmlns:efrbr-work="http://vfrbr.info/efrbr/1.1/work" xmlns:efrbr-expression="http://vfrbr.info/efrbr/1.1/expression" xmlns:efrbr-manifestation="http://vfrbr.info/efrbr/1.1/manifestation" xmlns:efrbr-person="http://vfrbr.info/efrbr/1.1/person" xmlns:efrbr-corporateBody="http://vfrbr.info/efrbr/1.1/corporateBody" xmlns:efrbr-concept="http://vfrbr.info/efrbr/1.1/concept" xmlns:efrbr-structure="http://vfrbr.info/efrbr/1.1/structure" xmlns:efrbr-responsible="http://vfrbr.info/efrbr/1.1/responsible" xmlns:efrbr-subject="http://vfrbr.info/efrbr/1.1/subject" xmlns:efrbr-other="http://vfrbr.info/efrbr/1.1/other" xsi:schemaLocation="http://vfrbr.info/efrbr/1.1 http://vfrbr.info/schemas/1.1/efrbr.xsd"><efrbr:entities><efrbr-work:work identifier="http://purl.tuc.gr/dl/dias/FBB6EA9E-B181-4D39-8F6C-4DDB3B0278DA"><efrbr-work:titleOfTheWork>Learning in zero–sum team Markov games using factored value functions</efrbr-work:titleOfTheWork></efrbr-work:work><efrbr-expression:expression identifier="http://purl.tuc.gr/dl/dias/FBB6EA9E-B181-4D39-8F6C-4DDB3B0278DA"><efrbr-expression:titleOfTheExpression>Learning in zero–sum team Markov games using factored value functions</efrbr-expression:titleOfTheExpression><efrbr-expression:formOfExpression vocabulary="DIAS:TYPES">
            Πλήρης Δημοσίευση σε Συνέδριο
            Conference Full Paper
         </efrbr-expression:formOfExpression><efrbr-expression:dateOfExpression type="issued">2015-11-13</efrbr-expression:dateOfExpression><efrbr-expression:dateOfExpression type="published">2002</efrbr-expression:dateOfExpression><efrbr-expression:languageOfExpression vocabulary="iso639-1">en</efrbr-expression:languageOfExpression><efrbr-expression:summarizationOfContent>We present a new method for learning good strategies in zero-sum
Markov games in which each side is composed of multiple agents collaborating
against an opposing team of agents. Our method requires full
observability and communication during learning, but the learned policies
can be executed in a distributed manner. The value function is represented
as a factored linear architecture and its structure determines the
necessary computational resources and communication bandwidth. This
approach permits a tradeoff between simple representations with little or
no communication between agents and complex, computationally intensive
representations with extensive coordination between agents. Thus,
we provide a principled means of using approximation to combat the
exponential blowup in the joint action space of the participants. The approach
is demonstrated with an example that shows the efficiency gains
over naive enumeration.
</efrbr-expression:summarizationOfContent><efrbr-expression:useRestrictionsOnTheExpression type="creative-commons">http://creativecommons.org/licenses/by/4.0/</efrbr-expression:useRestrictionsOnTheExpression><efrbr-expression:note type="page range">1659–1666</efrbr-expression:note><efrbr-expression:note type="conference name">Neural Information Processing Systems</efrbr-expression:note><efrbr-expression:note type="proceedings title">Proceedings of NIPS 2002: Neural Information Processing Systems, Vancouver, BC, Canada</efrbr-expression:note></efrbr-expression:expression><efrbr-person:person identifier="http://users.isc.tuc.gr/~lagoudakis"><efrbr-person:nameOfPerson vocabulary="TUC:LDAP">
            Lagoudakis Michael
            Λαγουδακης Μιχαηλ
         </efrbr-person:nameOfPerson></efrbr-person:person><efrbr-person:person identifier="554BE05E-EAF7-4BE5-B322-12042364A6EB"><efrbr-person:nameOfPerson vocabulary="">
            Parr, R.
         </efrbr-person:nameOfPerson></efrbr-person:person><efrbr-concept:concept identifier="http://id.loc.gov/authorities/subjects/sh2007000125"><efrbr-concept:termForTheConcept>
            HMMs (Hidden Markov models)
            hidden markov models
            hmms hidden markov models
         </efrbr-concept:termForTheConcept></efrbr-concept:concept></efrbr:entities><efrbr:relationships><efrbr-structure:structureRelations><efrbr-structure:realizedThrough sourceEntity="work" targetEntity="expression" sourceURI="http://purl.tuc.gr/dl/dias/FBB6EA9E-B181-4D39-8F6C-4DDB3B0278DA" targetURI="http://purl.tuc.gr/dl/dias/FBB6EA9E-B181-4D39-8F6C-4DDB3B0278DA"/></efrbr-structure:structureRelations><efrbr-responsible:responsibleRelations><efrbr-responsible:createdBy sourceEntity="work" targetEntity="person" sourceURI="http://purl.tuc.gr/dl/dias/FBB6EA9E-B181-4D39-8F6C-4DDB3B0278DA" targetURI="http://users.isc.tuc.gr/~lagoudakis"/><efrbr-responsible:realizedBy sourceEntity="expression" role="author" targetEntity="person" sourceURI="http://purl.tuc.gr/dl/dias/FBB6EA9E-B181-4D39-8F6C-4DDB3B0278DA" targetURI="http://users.isc.tuc.gr/~lagoudakis"/><efrbr-responsible:realizedBy sourceEntity="expression" role="author" targetEntity="person" sourceURI="http://purl.tuc.gr/dl/dias/FBB6EA9E-B181-4D39-8F6C-4DDB3B0278DA" targetURI="554BE05E-EAF7-4BE5-B322-12042364A6EB"/></efrbr-responsible:responsibleRelations><efrbr-subject:subjectRelations><efrbr-subject:hasSubject sourceEntity="work" targetEntity="concept" sourceURI="http://purl.tuc.gr/dl/dias/FBB6EA9E-B181-4D39-8F6C-4DDB3B0278DA" targetURI="http://id.loc.gov/authorities/subjects/sh2007000125"/></efrbr-subject:subjectRelations><efrbr-other:otherRelations/></efrbr:relationships></efrbr:recordSet>