MixCE: Training Autoregressive Language Models by Mixing Forward and Reverse Cross-Entropies.
Resource URI: https://dblp.l3s.de/d2r/resource/publications/conf/acl/ZhangWILBDR23
Home
|
Example Publications
Property
Value
dcterms:
bibliographicCitation
<
http://dblp.uni-trier.de/rec/bibtex/conf/acl/ZhangWILBDR23
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/David_S._Rosenberg
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Mark_Dredze
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Mohit_Bansal
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Ozan_Irsoy
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Shijie_Wu
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Shiyue_Zhang
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Steven_Lu_0003
>
foaf:
homepage
<
http://dx.doi.org/doi.org%2F10.18653%2Fv1%2F2023.acl-long.502
>
foaf:
homepage
<
https://doi.org/10.18653/v1/2023.acl-long.502
>
dc:
identifier
DBLP conf/acl/ZhangWILBDR23
(xsd:string)
dc:
identifier
DOI doi.org%2F10.18653%2Fv1%2F2023.acl-long.502
(xsd:string)
dcterms:
issued
2023
(xsd:gYear)
rdfs:
label
MixCE: Training Autoregressive Language Models by Mixing Forward and Reverse Cross-Entropies.
(xsd:string)
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/David_S._Rosenberg
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Mark_Dredze
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Mohit_Bansal
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Ozan_Irsoy
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Shijie_Wu
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Shiyue_Zhang
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Steven_Lu_0003
>
swrc:
pages
9027-9050
(xsd:string)
dcterms:
partOf
<
https://dblp.l3s.de/d2r/resource/publications/conf/acl/2023-1
>
owl:
sameAs
<
http://bibsonomy.org/uri/bibtexkey/conf/acl/ZhangWILBDR23/dblp
>
owl:
sameAs
<
http://dblp.rkbexplorer.com/id/conf/acl/ZhangWILBDR23
>
rdfs:
seeAlso
<
http://dblp.uni-trier.de/db/conf/acl/acl2023-1.html#ZhangWILBDR23
>
rdfs:
seeAlso
<
https://doi.org/10.18653/v1/2023.acl-long.502
>
swrc:
series
<
https://dblp.l3s.de/d2r/resource/conferences/acl
>
dc:
title
MixCE: Training Autoregressive Language Models by Mixing Forward and Reverse Cross-Entropies.
(xsd:string)
dc:
type
<
http://purl.org/dc/dcmitype/Text
>
rdf:
type
swrc:InProceedings
rdf:
type
foaf:Document