The Capacity for Moral Self-Correction in Large Language Models.
Resource URI: https://dblp.l3s.de/d2r/resource/publications/journals/corr/abs-2302-07459
Home
|
Example Publications
Property
Value
dcterms:
bibliographicCitation
<
http://dblp.uni-trier.de/rec/bibtex/journals/corr/abs-2302-07459
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Amanda_Askell
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Anna_Chen
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Anna_Goldie
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Azalia_Mirhoseini
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Ben_Mann
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Catherine_Olsson
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Christopher_Olah
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Danny_Hernandez
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Dario_Amodei
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Dawn_Drain
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Deep_Ganguli
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Dustin_Li
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Eli_Tran-Johnson
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Ethan_Perez
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Jack_Clark
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Jackson_Kernion
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Jamie_Kerr
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Jared_Kaplan
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Jared_Mueller
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Joshua_Landau
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Kamal_Ndousse
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Kamile_Lukosiute
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Karina_Nguyen
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Liane_Lovitt
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Michael_Sellitto
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Nelson_Elhage
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Nicholas_Joseph
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Nicholas_Schiefer
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Noem%E2%88%9A%E2%89%A0_Mercado
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Nova_DasSarma
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Oliver_Rausch
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Robert_Lasenby
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Robin_Larson
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Sam_McCandlish
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Sam_Ringer
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Samuel_R._Bowman
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Sandipan_Kundu
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Saurav_Kadavath
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Scott_Johnston
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Shauna_Kravec
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Sheer_El_Showk
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Tamera_Lanham
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Thomas_I._Liao
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Timothy_Telleen-Lawton
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Tom_Brown
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Tom_Henighan
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Tristan_Hume
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Yuntao_Bai
>
dc:
creator
<
https://dblp.l3s.de/d2r/resource/authors/Zac_Hatfield-Dodds
>
foaf:
homepage
<
http://dx.doi.org/doi.org%2F10.48550%2FarXiv.2302.07459
>
foaf:
homepage
<
https://doi.org/10.48550/arXiv.2302.07459
>
dc:
identifier
DBLP journals/corr/abs-2302-07459
(xsd:string)
dc:
identifier
DOI doi.org%2F10.48550%2FarXiv.2302.07459
(xsd:string)
dcterms:
issued
2023
(xsd:gYear)
swrc:
journal
<
https://dblp.l3s.de/d2r/resource/journals/corr
>
rdfs:
label
The Capacity for Moral Self-Correction in Large Language Models.
(xsd:string)
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Amanda_Askell
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Anna_Chen
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Anna_Goldie
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Azalia_Mirhoseini
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Ben_Mann
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Catherine_Olsson
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Christopher_Olah
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Danny_Hernandez
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Dario_Amodei
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Dawn_Drain
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Deep_Ganguli
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Dustin_Li
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Eli_Tran-Johnson
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Ethan_Perez
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Jack_Clark
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Jackson_Kernion
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Jamie_Kerr
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Jared_Kaplan
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Jared_Mueller
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Joshua_Landau
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Kamal_Ndousse
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Kamile_Lukosiute
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Karina_Nguyen
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Liane_Lovitt
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Michael_Sellitto
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Nelson_Elhage
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Nicholas_Joseph
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Nicholas_Schiefer
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Noem%E2%88%9A%E2%89%A0_Mercado
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Nova_DasSarma
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Oliver_Rausch
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Robert_Lasenby
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Robin_Larson
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Sam_McCandlish
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Sam_Ringer
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Samuel_R._Bowman
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Sandipan_Kundu
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Saurav_Kadavath
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Scott_Johnston
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Shauna_Kravec
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Sheer_El_Showk
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Tamera_Lanham
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Thomas_I._Liao
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Timothy_Telleen-Lawton
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Tom_Brown
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Tom_Henighan
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Tristan_Hume
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Yuntao_Bai
>
foaf:
maker
<
https://dblp.l3s.de/d2r/resource/authors/Zac_Hatfield-Dodds
>
owl:
sameAs
<
http://bibsonomy.org/uri/bibtexkey/journals/corr/abs-2302-07459/dblp
>
owl:
sameAs
<
http://dblp.rkbexplorer.com/id/journals/corr/abs-2302-07459
>
rdfs:
seeAlso
<
http://dblp.uni-trier.de/db/journals/corr/corr2302.html#abs-2302-07459
>
rdfs:
seeAlso
<
https://doi.org/10.48550/arXiv.2302.07459
>
dc:
title
The Capacity for Moral Self-Correction in Large Language Models.
(xsd:string)
dc:
type
<
http://purl.org/dc/dcmitype/Text
>
rdf:
type
swrc:Article
rdf:
type
foaf:Document
swrc:
volume
abs/2302.07459
(xsd:string)