Discounting-free policy gradient reinforcement learning from transient states
Resource URI: https://dblp.l3s.de/d2r/resource/publications/phd/au/Dewanto22
Home
|
Example Publications
Property
Value
dcterms:
bibliographicCitation
<
http://dblp.uni-trier.de/rec/bibtex/phd/au/Dewanto22
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Vektor_Dewanto
>
foaf:
homepage
<
http://dx.doi.org/doi.org%2F10.14264%2F9d6f9aa
>
foaf:
homepage
<
https://doi.org/10.14264/9d6f9aa
>
dc:
identifier
DBLP phd/au/Dewanto22
(xsd:string)
dc:
identifier
DOI doi.org%2F10.14264%2F9d6f9aa
(xsd:string)
dcterms:
issued
2022
(xsd:gYear)
rdfs:
label
Discounting-free policy gradient reinforcement learning from transient states
(xsd:string)
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Vektor_Dewanto
>
dc:
publisher
University of Queensland, Australia
(xsd:string)
owl:
sameAs
<
http://bibsonomy.org/uri/bibtexkey/phd/au/Dewanto22/dblp
>
owl:
sameAs
<
http://dblp.rkbexplorer.com/id/phd/au/Dewanto22
>
rdfs:
seeAlso
<
https://doi.org/10.14264/9d6f9aa
>
dc:
title
Discounting-free policy gradient reinforcement learning from transient states
(xsd:string)
dc:
type
<
http://purl.org/dc/dcmitype/Text
>
rdf:
type
swrc:PhDThesis
rdf:
type
foaf:Document