[RDF data]
Home | Example Publications
PropertyValue
dcterms:bibliographicCitation <http://dblp.uni-trier.de/rec/bibtex/journals/aamas/BuffetDC07>
dc:creator <http://dblp.l3s.de/d2r/resource/authors/Alain_Dutech>
dc:creator <http://dblp.l3s.de/d2r/resource/authors/Fran%C3%A7ois_Charpillet>
dc:creator <http://dblp.l3s.de/d2r/resource/authors/Olivier_Buffet>
foaf:homepage <http://dx.doi.org/10.1007%2Fs10458-006-9010-5>
foaf:homepage <http://dx.doi.org/10.1007/s10458-006-9010-5>
dc:identifier DBLP journals/aamas/BuffetDC07 (xsd:string)
dc:identifier DOI 10.1007%2Fs10458-006-9010-5 (xsd:string)
dcterms:issued 2007 (xsd:gYear)
swrc:journal <http://dblp.l3s.de/d2r/resource/journals/aamas>
rdfs:label Shaping multi-agent systems with gradient reinforcement learning. (xsd:string)
foaf:maker <http://dblp.l3s.de/d2r/resource/authors/Alain_Dutech>
foaf:maker <http://dblp.l3s.de/d2r/resource/authors/Fran%C3%A7ois_Charpillet>
foaf:maker <http://dblp.l3s.de/d2r/resource/authors/Olivier_Buffet>
swrc:number 2 (xsd:string)
swrc:pages 197-220 (xsd:string)
owl:sameAs <http://bibsonomy.org/uri/bibtexkey/journals/aamas/BuffetDC07/dblp>
owl:sameAs <http://dblp.rkbexplorer.com/id/journals/aamas/BuffetDC07>
rdfs:seeAlso <http://dblp.uni-trier.de/db/journals/aamas/aamas15.html#BuffetDC07>
rdfs:seeAlso <http://dx.doi.org/10.1007/s10458-006-9010-5>
dc:subject Reinforcement learning; Multi-agent systems; Partially observable Markov decision processes; Shaping; Policy-gradient (xsd:string)
dc:title Shaping multi-agent systems with gradient reinforcement learning. (xsd:string)
dc:type <http://purl.org/dc/dcmitype/Text>
rdf:type swrc:Article
rdf:type foaf:Document
swrc:volume 15 (xsd:string)