Convergence Proof for Actor-Critic Methods Applied to PPO and RUDDER.
Resource URI: https://dblp.l3s.de/d2r/resource/publications/journals/tlsdkcs/HolzleitnerGABH21
Home
|
Example Publications
Property
Value
dcterms:
bibliographicCitation
<
http://dblp.uni-trier.de/rec/bibtex/journals/tlsdkcs/HolzleitnerGABH21
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Johannes_Brandstetter
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Jos%E2%88%9A%C2%A9_Antonio_Arjona-Medina
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Lukas_Gruber
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Markus_Holzleitner
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Sepp_Hochreiter
>
foaf:
homepage
<
http://dx.doi.org/doi.org%2F10.1007%2F978-3-662-63519-3%5F5
>
foaf:
homepage
<
https://doi.org/10.1007/978-3-662-63519-3_5
>
dc:
identifier
DBLP journals/tlsdkcs/HolzleitnerGABH21
(xsd:string)
dc:
identifier
DOI doi.org%2F10.1007%2F978-3-662-63519-3%5F5
(xsd:string)
dcterms:
issued
2021
(xsd:gYear)
rdfs:
label
Convergence Proof for Actor-Critic Methods Applied to PPO and RUDDER.
(xsd:string)
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Johannes_Brandstetter
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Jos%E2%88%9A%C2%A9_Antonio_Arjona-Medina
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Lukas_Gruber
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Markus_Holzleitner
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Sepp_Hochreiter
>
swrc:
pages
105-130
(xsd:string)
dcterms:
partOf
<
https://dblp.l3s.de/d2r/resource/publications/journals/tlsdkcs/2021-48
>
owl:
sameAs
<
http://bibsonomy.org/uri/bibtexkey/journals/tlsdkcs/HolzleitnerGABH21/dblp
>
owl:
sameAs
<
http://dblp.rkbexplorer.com/id/journals/tlsdkcs/HolzleitnerGABH21
>
rdfs:
seeAlso
<
http://dblp.uni-trier.de/db/journals/tlsdkcs/tlsdkcs48.html#HolzleitnerGABH21
>
rdfs:
seeAlso
<
https://doi.org/10.1007/978-3-662-63519-3_5
>
swrc:
series
<
https://dblp.l3s.de/d2r/resource/conferences/tlsdkcs
>
dc:
title
Convergence Proof for Actor-Critic Methods Applied to PPO and RUDDER.
(xsd:string)
dc:
type
<
http://purl.org/dc/dcmitype/Text
>
rdf:
type
swrc:InProceedings
rdf:
type
foaf:Document
swrc:
volume
48
(xsd:string)