Pessimistic Minimax Value Iteration: Provably Efficient Equilibrium Learning from Offline Datasets.
Resource URI: https://dblp.l3s.de/d2r/resource/publications/conf/icml/ZhongXTWZWY22
Home
|
Example Publications
Property
Value
dcterms:
bibliographicCitation
<
http://dblp.uni-trier.de/rec/bibtex/conf/icml/ZhongXTWZWY22
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Han_Zhong_0001
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Jiyuan_Tan
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Liwei_Wang_0001
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Tong_Zhang_0001
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Wei_Xiong_0015
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Zhaoran_Wang_0001
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Zhuoran_Yang
>
foaf:
homepage
<
https://proceedings.mlr.press/v162/zhong22b.html
>
dc:
identifier
DBLP conf/icml/ZhongXTWZWY22
(xsd:string)
dcterms:
issued
2022
(xsd:gYear)
rdfs:
label
Pessimistic Minimax Value Iteration: Provably Efficient Equilibrium Learning from Offline Datasets.
(xsd:string)
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Han_Zhong_0001
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Jiyuan_Tan
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Liwei_Wang_0001
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Tong_Zhang_0001
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Wei_Xiong_0015
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Zhaoran_Wang_0001
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Zhuoran_Yang
>
swrc:
pages
27117-27142
(xsd:string)
dcterms:
partOf
<
https://dblp.l3s.de/d2r/resource/publications/conf/icml/2022
>
owl:
sameAs
<
http://bibsonomy.org/uri/bibtexkey/conf/icml/ZhongXTWZWY22/dblp
>
owl:
sameAs
<
http://dblp.rkbexplorer.com/id/conf/icml/ZhongXTWZWY22
>
rdfs:
seeAlso
<
http://dblp.uni-trier.de/db/conf/icml/icml2022.html#ZhongXTWZWY22
>
rdfs:
seeAlso
<
https://proceedings.mlr.press/v162/zhong22b.html
>
swrc:
series
<
https://dblp.l3s.de/d2r/resource/conferences/icml
>
dc:
title
Pessimistic Minimax Value Iteration: Provably Efficient Equilibrium Learning from Offline Datasets.
(xsd:string)
dc:
type
<
http://purl.org/dc/dcmitype/Text
>
rdf:
type
swrc:InProceedings
rdf:
type
foaf:Document