Hinge Policy Optimization: Rethinking Policy Improvement and Reinterpreting PPO.
Resource URI: https://dblp.l3s.de/d2r/resource/publications/journals/corr/abs-2110-13799
Home
|
Example Publications
Property
Value
dcterms:
bibliographicCitation
<
http://dblp.uni-trier.de/rec/bibtex/journals/corr/abs-2110-13799
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Hsuan-Yu_Yao
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/I-Chen_Wu
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Kai-Chun_Hu
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Kuo-Hao_Ho
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Liang-Chun_Ouyang
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Ping-Chun_Hsieh
>
foaf:
homepage
<
https://arxiv.org/abs/2110.13799
>
dc:
identifier
DBLP journals/corr/abs-2110-13799
(xsd:string)
dcterms:
issued
2021
(xsd:gYear)
swrc:
journal
<
https://dblp.l3s.de/d2r/resource/journals/corr
>
rdfs:
label
Hinge Policy Optimization: Rethinking Policy Improvement and Reinterpreting PPO.
(xsd:string)
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Hsuan-Yu_Yao
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/I-Chen_Wu
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Kai-Chun_Hu
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Kuo-Hao_Ho
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Liang-Chun_Ouyang
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Ping-Chun_Hsieh
>
owl:
sameAs
<
http://bibsonomy.org/uri/bibtexkey/journals/corr/abs-2110-13799/dblp
>
owl:
sameAs
<
http://dblp.rkbexplorer.com/id/journals/corr/abs-2110-13799
>
rdfs:
seeAlso
<
http://dblp.uni-trier.de/db/journals/corr/corr2110.html#abs-2110-13799
>
rdfs:
seeAlso
<
https://arxiv.org/abs/2110.13799
>
dc:
title
Hinge Policy Optimization: Rethinking Policy Improvement and Reinterpreting PPO.
(xsd:string)
dc:
type
<
http://purl.org/dc/dcmitype/Text
>
rdf:
type
swrc:Article
rdf:
type
foaf:Document
swrc:
volume
abs/2110.13799
(xsd:string)