DeepSeekMoE: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models.
Resource URI: https://dblp.l3s.de/d2r/resource/publications/journals/corr/abs-2401-06066
Home
|
Example Publications
Property
Value
dcterms:
bibliographicCitation
<
http://dblp.uni-trier.de/rec/bibtex/journals/corr/abs-2401-06066
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Chenggang_Zhao
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Chengqi_Deng
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Chong_Ruan
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Damai_Dai
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Deli_Chen
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Fuli_Luo
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Huazuo_Gao
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Jiashi_Li
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Panpan_Huang
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/R._X._Xu
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Wangding_Zeng
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Wenfeng_Liang
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Xingkai_Yu
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Y._K._Li
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Y._Wu
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Zhenda_Xie
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Zhifang_Sui
>
foaf:
homepage
<
http://dx.doi.org/doi.org%2F10.48550%2FarXiv.2401.06066
>
foaf:
homepage
<
https://doi.org/10.48550/arXiv.2401.06066
>
dc:
identifier
DBLP journals/corr/abs-2401-06066
(xsd:string)
dc:
identifier
DOI doi.org%2F10.48550%2FarXiv.2401.06066
(xsd:string)
dcterms:
issued
2024
(xsd:gYear)
swrc:
journal
<
https://dblp.l3s.de/d2r/resource/journals/corr
>
rdfs:
label
DeepSeekMoE: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models.
(xsd:string)
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Chenggang_Zhao
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Chengqi_Deng
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Chong_Ruan
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Damai_Dai
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Deli_Chen
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Fuli_Luo
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Huazuo_Gao
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Jiashi_Li
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Panpan_Huang
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/R._X._Xu
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Wangding_Zeng
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Wenfeng_Liang
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Xingkai_Yu
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Y._K._Li
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Y._Wu
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Zhenda_Xie
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Zhifang_Sui
>
owl:
sameAs
<
http://bibsonomy.org/uri/bibtexkey/journals/corr/abs-2401-06066/dblp
>
owl:
sameAs
<
http://dblp.rkbexplorer.com/id/journals/corr/abs-2401-06066
>
rdfs:
seeAlso
<
http://dblp.uni-trier.de/db/journals/corr/corr2401.html#abs-2401-06066
>
rdfs:
seeAlso
<
https://doi.org/10.48550/arXiv.2401.06066
>
dc:
title
DeepSeekMoE: Towards Ultimate Expert Specialization in Mixture-of-Experts Language Models.
(xsd:string)
dc:
type
<
http://purl.org/dc/dcmitype/Text
>
rdf:
type
swrc:Article
rdf:
type
foaf:Document
swrc:
volume
abs/2401.06066
(xsd:string)