[RDF data]
Home | Example Publications
PropertyValue
dcterms:bibliographicCitation <http://dblp.uni-trier.de/rec/bibtex/journals/corr/abs-2110-13799>
dc:creator <https://dblp.l3s.de/d2r/resource/authors/Hsuan-Yu_Yao>
dc:creator <https://dblp.l3s.de/d2r/resource/authors/I-Chen_Wu>
dc:creator <https://dblp.l3s.de/d2r/resource/authors/Kai-Chun_Hu>
dc:creator <https://dblp.l3s.de/d2r/resource/authors/Kuo-Hao_Ho>
dc:creator <https://dblp.l3s.de/d2r/resource/authors/Liang-Chun_Ouyang>
dc:creator <https://dblp.l3s.de/d2r/resource/authors/Ping-Chun_Hsieh>
foaf:homepage <https://arxiv.org/abs/2110.13799>
dc:identifier DBLP journals/corr/abs-2110-13799 (xsd:string)
dcterms:issued 2021 (xsd:gYear)
swrc:journal <https://dblp.l3s.de/d2r/resource/journals/corr>
rdfs:label Hinge Policy Optimization: Rethinking Policy Improvement and Reinterpreting PPO. (xsd:string)
foaf:maker <https://dblp.l3s.de/d2r/resource/authors/Hsuan-Yu_Yao>
foaf:maker <https://dblp.l3s.de/d2r/resource/authors/I-Chen_Wu>
foaf:maker <https://dblp.l3s.de/d2r/resource/authors/Kai-Chun_Hu>
foaf:maker <https://dblp.l3s.de/d2r/resource/authors/Kuo-Hao_Ho>
foaf:maker <https://dblp.l3s.de/d2r/resource/authors/Liang-Chun_Ouyang>
foaf:maker <https://dblp.l3s.de/d2r/resource/authors/Ping-Chun_Hsieh>
owl:sameAs <http://bibsonomy.org/uri/bibtexkey/journals/corr/abs-2110-13799/dblp>
owl:sameAs <http://dblp.rkbexplorer.com/id/journals/corr/abs-2110-13799>
rdfs:seeAlso <http://dblp.uni-trier.de/db/journals/corr/corr2110.html#abs-2110-13799>
rdfs:seeAlso <https://arxiv.org/abs/2110.13799>
dc:title Hinge Policy Optimization: Rethinking Policy Improvement and Reinterpreting PPO. (xsd:string)
dc:type <http://purl.org/dc/dcmitype/Text>
rdf:type swrc:Article
rdf:type foaf:Document
swrc:volume abs/2110.13799 (xsd:string)