1 Star 2 Fork 2

Hugging Face 模型镜像 / Qwen-72B-Chat

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
克隆/下载
model.safetensors.index.json 47.45 KB
一键复制 编辑 原始数据 按行查看 历史
yangapku 提交于 2023-11-29 18:43 . init upload
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650
{
"metadata": {
"total_size": 144575840256
},
"weight_map": {
"lm_head.weight": "model-00082-of-00082.safetensors",
"transformer.h.0.attn.c_attn.bias": "model-00002-of-00082.safetensors",
"transformer.h.0.attn.c_attn.weight": "model-00002-of-00082.safetensors",
"transformer.h.0.attn.c_proj.weight": "model-00002-of-00082.safetensors",
"transformer.h.0.ln_1.weight": "model-00002-of-00082.safetensors",
"transformer.h.0.ln_2.weight": "model-00002-of-00082.safetensors",
"transformer.h.0.mlp.c_proj.weight": "model-00002-of-00082.safetensors",
"transformer.h.0.mlp.w1.weight": "model-00002-of-00082.safetensors",
"transformer.h.0.mlp.w2.weight": "model-00002-of-00082.safetensors",
"transformer.h.1.attn.c_attn.bias": "model-00003-of-00082.safetensors",
"transformer.h.1.attn.c_attn.weight": "model-00003-of-00082.safetensors",
"transformer.h.1.attn.c_proj.weight": "model-00003-of-00082.safetensors",
"transformer.h.1.ln_1.weight": "model-00002-of-00082.safetensors",
"transformer.h.1.ln_2.weight": "model-00003-of-00082.safetensors",
"transformer.h.1.mlp.c_proj.weight": "model-00003-of-00082.safetensors",
"transformer.h.1.mlp.w1.weight": "model-00003-of-00082.safetensors",
"transformer.h.1.mlp.w2.weight": "model-00003-of-00082.safetensors",
"transformer.h.10.attn.c_attn.bias": "model-00012-of-00082.safetensors",
"transformer.h.10.attn.c_attn.weight": "model-00012-of-00082.safetensors",
"transformer.h.10.attn.c_proj.weight": "model-00012-of-00082.safetensors",
"transformer.h.10.ln_1.weight": "model-00011-of-00082.safetensors",
"transformer.h.10.ln_2.weight": "model-00012-of-00082.safetensors",
"transformer.h.10.mlp.c_proj.weight": "model-00012-of-00082.safetensors",
"transformer.h.10.mlp.w1.weight": "model-00012-of-00082.safetensors",
"transformer.h.10.mlp.w2.weight": "model-00012-of-00082.safetensors",
"transformer.h.11.attn.c_attn.bias": "model-00013-of-00082.safetensors",
"transformer.h.11.attn.c_attn.weight": "model-00013-of-00082.safetensors",
"transformer.h.11.attn.c_proj.weight": "model-00013-of-00082.safetensors",
"transformer.h.11.ln_1.weight": "model-00012-of-00082.safetensors",
"transformer.h.11.ln_2.weight": "model-00013-of-00082.safetensors",
"transformer.h.11.mlp.c_proj.weight": "model-00013-of-00082.safetensors",
"transformer.h.11.mlp.w1.weight": "model-00013-of-00082.safetensors",
"transformer.h.11.mlp.w2.weight": "model-00013-of-00082.safetensors",
"transformer.h.12.attn.c_attn.bias": "model-00014-of-00082.safetensors",
"transformer.h.12.attn.c_attn.weight": "model-00014-of-00082.safetensors",
"transformer.h.12.attn.c_proj.weight": "model-00014-of-00082.safetensors",
"transformer.h.12.ln_1.weight": "model-00013-of-00082.safetensors",
"transformer.h.12.ln_2.weight": "model-00014-of-00082.safetensors",
"transformer.h.12.mlp.c_proj.weight": "model-00014-of-00082.safetensors",
"transformer.h.12.mlp.w1.weight": "model-00014-of-00082.safetensors",
"transformer.h.12.mlp.w2.weight": "model-00014-of-00082.safetensors",
"transformer.h.13.attn.c_attn.bias": "model-00015-of-00082.safetensors",
"transformer.h.13.attn.c_attn.weight": "model-00015-of-00082.safetensors",
"transformer.h.13.attn.c_proj.weight": "model-00015-of-00082.safetensors",
"transformer.h.13.ln_1.weight": "model-00014-of-00082.safetensors",
"transformer.h.13.ln_2.weight": "model-00015-of-00082.safetensors",
"transformer.h.13.mlp.c_proj.weight": "model-00015-of-00082.safetensors",
"transformer.h.13.mlp.w1.weight": "model-00015-of-00082.safetensors",
"transformer.h.13.mlp.w2.weight": "model-00015-of-00082.safetensors",
"transformer.h.14.attn.c_attn.bias": "model-00016-of-00082.safetensors",
"transformer.h.14.attn.c_attn.weight": "model-00016-of-00082.safetensors",
"transformer.h.14.attn.c_proj.weight": "model-00016-of-00082.safetensors",
"transformer.h.14.ln_1.weight": "model-00015-of-00082.safetensors",
"transformer.h.14.ln_2.weight": "model-00016-of-00082.safetensors",
"transformer.h.14.mlp.c_proj.weight": "model-00016-of-00082.safetensors",
"transformer.h.14.mlp.w1.weight": "model-00016-of-00082.safetensors",
"transformer.h.14.mlp.w2.weight": "model-00016-of-00082.safetensors",
"transformer.h.15.attn.c_attn.bias": "model-00017-of-00082.safetensors",
"transformer.h.15.attn.c_attn.weight": "model-00017-of-00082.safetensors",
"transformer.h.15.attn.c_proj.weight": "model-00017-of-00082.safetensors",
"transformer.h.15.ln_1.weight": "model-00016-of-00082.safetensors",
"transformer.h.15.ln_2.weight": "model-00017-of-00082.safetensors",
"transformer.h.15.mlp.c_proj.weight": "model-00017-of-00082.safetensors",
"transformer.h.15.mlp.w1.weight": "model-00017-of-00082.safetensors",
"transformer.h.15.mlp.w2.weight": "model-00017-of-00082.safetensors",
"transformer.h.16.attn.c_attn.bias": "model-00018-of-00082.safetensors",
"transformer.h.16.attn.c_attn.weight": "model-00018-of-00082.safetensors",
"transformer.h.16.attn.c_proj.weight": "model-00018-of-00082.safetensors",
"transformer.h.16.ln_1.weight": "model-00017-of-00082.safetensors",
"transformer.h.16.ln_2.weight": "model-00018-of-00082.safetensors",
"transformer.h.16.mlp.c_proj.weight": "model-00018-of-00082.safetensors",
"transformer.h.16.mlp.w1.weight": "model-00018-of-00082.safetensors",
"transformer.h.16.mlp.w2.weight": "model-00018-of-00082.safetensors",
"transformer.h.17.attn.c_attn.bias": "model-00019-of-00082.safetensors",
"transformer.h.17.attn.c_attn.weight": "model-00019-of-00082.safetensors",
"transformer.h.17.attn.c_proj.weight": "model-00019-of-00082.safetensors",
"transformer.h.17.ln_1.weight": "model-00018-of-00082.safetensors",
"transformer.h.17.ln_2.weight": "model-00019-of-00082.safetensors",
"transformer.h.17.mlp.c_proj.weight": "model-00019-of-00082.safetensors",
"transformer.h.17.mlp.w1.weight": "model-00019-of-00082.safetensors",
"transformer.h.17.mlp.w2.weight": "model-00019-of-00082.safetensors",
"transformer.h.18.attn.c_attn.bias": "model-00020-of-00082.safetensors",
"transformer.h.18.attn.c_attn.weight": "model-00020-of-00082.safetensors",
"transformer.h.18.attn.c_proj.weight": "model-00020-of-00082.safetensors",
"transformer.h.18.ln_1.weight": "model-00019-of-00082.safetensors",
"transformer.h.18.ln_2.weight": "model-00020-of-00082.safetensors",
"transformer.h.18.mlp.c_proj.weight": "model-00020-of-00082.safetensors",
"transformer.h.18.mlp.w1.weight": "model-00020-of-00082.safetensors",
"transformer.h.18.mlp.w2.weight": "model-00020-of-00082.safetensors",
"transformer.h.19.attn.c_attn.bias": "model-00021-of-00082.safetensors",
"transformer.h.19.attn.c_attn.weight": "model-00021-of-00082.safetensors",
"transformer.h.19.attn.c_proj.weight": "model-00021-of-00082.safetensors",
"transformer.h.19.ln_1.weight": "model-00020-of-00082.safetensors",
"transformer.h.19.ln_2.weight": "model-00021-of-00082.safetensors",
"transformer.h.19.mlp.c_proj.weight": "model-00021-of-00082.safetensors",
"transformer.h.19.mlp.w1.weight": "model-00021-of-00082.safetensors",
"transformer.h.19.mlp.w2.weight": "model-00021-of-00082.safetensors",
"transformer.h.2.attn.c_attn.bias": "model-00004-of-00082.safetensors",
"transformer.h.2.attn.c_attn.weight": "model-00004-of-00082.safetensors",
"transformer.h.2.attn.c_proj.weight": "model-00004-of-00082.safetensors",
"transformer.h.2.ln_1.weight": "model-00003-of-00082.safetensors",
"transformer.h.2.ln_2.weight": "model-00004-of-00082.safetensors",
"transformer.h.2.mlp.c_proj.weight": "model-00004-of-00082.safetensors",
"transformer.h.2.mlp.w1.weight": "model-00004-of-00082.safetensors",
"transformer.h.2.mlp.w2.weight": "model-00004-of-00082.safetensors",
"transformer.h.20.attn.c_attn.bias": "model-00022-of-00082.safetensors",
"transformer.h.20.attn.c_attn.weight": "model-00022-of-00082.safetensors",
"transformer.h.20.attn.c_proj.weight": "model-00022-of-00082.safetensors",
"transformer.h.20.ln_1.weight": "model-00021-of-00082.safetensors",
"transformer.h.20.ln_2.weight": "model-00022-of-00082.safetensors",
"transformer.h.20.mlp.c_proj.weight": "model-00022-of-00082.safetensors",
"transformer.h.20.mlp.w1.weight": "model-00022-of-00082.safetensors",
"transformer.h.20.mlp.w2.weight": "model-00022-of-00082.safetensors",
"transformer.h.21.attn.c_attn.bias": "model-00023-of-00082.safetensors",
"transformer.h.21.attn.c_attn.weight": "model-00023-of-00082.safetensors",
"transformer.h.21.attn.c_proj.weight": "model-00023-of-00082.safetensors",
"transformer.h.21.ln_1.weight": "model-00022-of-00082.safetensors",
"transformer.h.21.ln_2.weight": "model-00023-of-00082.safetensors",
"transformer.h.21.mlp.c_proj.weight": "model-00023-of-00082.safetensors",
"transformer.h.21.mlp.w1.weight": "model-00023-of-00082.safetensors",
"transformer.h.21.mlp.w2.weight": "model-00023-of-00082.safetensors",
"transformer.h.22.attn.c_attn.bias": "model-00024-of-00082.safetensors",
"transformer.h.22.attn.c_attn.weight": "model-00024-of-00082.safetensors",
"transformer.h.22.attn.c_proj.weight": "model-00024-of-00082.safetensors",
"transformer.h.22.ln_1.weight": "model-00023-of-00082.safetensors",
"transformer.h.22.ln_2.weight": "model-00024-of-00082.safetensors",
"transformer.h.22.mlp.c_proj.weight": "model-00024-of-00082.safetensors",
"transformer.h.22.mlp.w1.weight": "model-00024-of-00082.safetensors",
"transformer.h.22.mlp.w2.weight": "model-00024-of-00082.safetensors",
"transformer.h.23.attn.c_attn.bias": "model-00025-of-00082.safetensors",
"transformer.h.23.attn.c_attn.weight": "model-00025-of-00082.safetensors",
"transformer.h.23.attn.c_proj.weight": "model-00025-of-00082.safetensors",
"transformer.h.23.ln_1.weight": "model-00024-of-00082.safetensors",
"transformer.h.23.ln_2.weight": "model-00025-of-00082.safetensors",
"transformer.h.23.mlp.c_proj.weight": "model-00025-of-00082.safetensors",
"transformer.h.23.mlp.w1.weight": "model-00025-of-00082.safetensors",
"transformer.h.23.mlp.w2.weight": "model-00025-of-00082.safetensors",
"transformer.h.24.attn.c_attn.bias": "model-00026-of-00082.safetensors",
"transformer.h.24.attn.c_attn.weight": "model-00026-of-00082.safetensors",
"transformer.h.24.attn.c_proj.weight": "model-00026-of-00082.safetensors",
"transformer.h.24.ln_1.weight": "model-00025-of-00082.safetensors",
"transformer.h.24.ln_2.weight": "model-00026-of-00082.safetensors",
"transformer.h.24.mlp.c_proj.weight": "model-00026-of-00082.safetensors",
"transformer.h.24.mlp.w1.weight": "model-00026-of-00082.safetensors",
"transformer.h.24.mlp.w2.weight": "model-00026-of-00082.safetensors",
"transformer.h.25.attn.c_attn.bias": "model-00027-of-00082.safetensors",
"transformer.h.25.attn.c_attn.weight": "model-00027-of-00082.safetensors",
"transformer.h.25.attn.c_proj.weight": "model-00027-of-00082.safetensors",
"transformer.h.25.ln_1.weight": "model-00026-of-00082.safetensors",
"transformer.h.25.ln_2.weight": "model-00027-of-00082.safetensors",
"transformer.h.25.mlp.c_proj.weight": "model-00027-of-00082.safetensors",
"transformer.h.25.mlp.w1.weight": "model-00027-of-00082.safetensors",
"transformer.h.25.mlp.w2.weight": "model-00027-of-00082.safetensors",
"transformer.h.26.attn.c_attn.bias": "model-00028-of-00082.safetensors",
"transformer.h.26.attn.c_attn.weight": "model-00028-of-00082.safetensors",
"transformer.h.26.attn.c_proj.weight": "model-00028-of-00082.safetensors",
"transformer.h.26.ln_1.weight": "model-00027-of-00082.safetensors",
"transformer.h.26.ln_2.weight": "model-00028-of-00082.safetensors",
"transformer.h.26.mlp.c_proj.weight": "model-00028-of-00082.safetensors",
"transformer.h.26.mlp.w1.weight": "model-00028-of-00082.safetensors",
"transformer.h.26.mlp.w2.weight": "model-00028-of-00082.safetensors",
"transformer.h.27.attn.c_attn.bias": "model-00029-of-00082.safetensors",
"transformer.h.27.attn.c_attn.weight": "model-00029-of-00082.safetensors",
"transformer.h.27.attn.c_proj.weight": "model-00029-of-00082.safetensors",
"transformer.h.27.ln_1.weight": "model-00028-of-00082.safetensors",
"transformer.h.27.ln_2.weight": "model-00029-of-00082.safetensors",
"transformer.h.27.mlp.c_proj.weight": "model-00029-of-00082.safetensors",
"transformer.h.27.mlp.w1.weight": "model-00029-of-00082.safetensors",
"transformer.h.27.mlp.w2.weight": "model-00029-of-00082.safetensors",
"transformer.h.28.attn.c_attn.bias": "model-00030-of-00082.safetensors",
"transformer.h.28.attn.c_attn.weight": "model-00030-of-00082.safetensors",
"transformer.h.28.attn.c_proj.weight": "model-00030-of-00082.safetensors",
"transformer.h.28.ln_1.weight": "model-00029-of-00082.safetensors",
"transformer.h.28.ln_2.weight": "model-00030-of-00082.safetensors",
"transformer.h.28.mlp.c_proj.weight": "model-00030-of-00082.safetensors",
"transformer.h.28.mlp.w1.weight": "model-00030-of-00082.safetensors",
"transformer.h.28.mlp.w2.weight": "model-00030-of-00082.safetensors",
"transformer.h.29.attn.c_attn.bias": "model-00031-of-00082.safetensors",
"transformer.h.29.attn.c_attn.weight": "model-00031-of-00082.safetensors",
"transformer.h.29.attn.c_proj.weight": "model-00031-of-00082.safetensors",
"transformer.h.29.ln_1.weight": "model-00030-of-00082.safetensors",
"transformer.h.29.ln_2.weight": "model-00031-of-00082.safetensors",
"transformer.h.29.mlp.c_proj.weight": "model-00031-of-00082.safetensors",
"transformer.h.29.mlp.w1.weight": "model-00031-of-00082.safetensors",
"transformer.h.29.mlp.w2.weight": "model-00031-of-00082.safetensors",
"transformer.h.3.attn.c_attn.bias": "model-00005-of-00082.safetensors",
"transformer.h.3.attn.c_attn.weight": "model-00005-of-00082.safetensors",
"transformer.h.3.attn.c_proj.weight": "model-00005-of-00082.safetensors",
"transformer.h.3.ln_1.weight": "model-00004-of-00082.safetensors",
"transformer.h.3.ln_2.weight": "model-00005-of-00082.safetensors",
"transformer.h.3.mlp.c_proj.weight": "model-00005-of-00082.safetensors",
"transformer.h.3.mlp.w1.weight": "model-00005-of-00082.safetensors",
"transformer.h.3.mlp.w2.weight": "model-00005-of-00082.safetensors",
"transformer.h.30.attn.c_attn.bias": "model-00032-of-00082.safetensors",
"transformer.h.30.attn.c_attn.weight": "model-00032-of-00082.safetensors",
"transformer.h.30.attn.c_proj.weight": "model-00032-of-00082.safetensors",
"transformer.h.30.ln_1.weight": "model-00031-of-00082.safetensors",
"transformer.h.30.ln_2.weight": "model-00032-of-00082.safetensors",
"transformer.h.30.mlp.c_proj.weight": "model-00032-of-00082.safetensors",
"transformer.h.30.mlp.w1.weight": "model-00032-of-00082.safetensors",
"transformer.h.30.mlp.w2.weight": "model-00032-of-00082.safetensors",
"transformer.h.31.attn.c_attn.bias": "model-00033-of-00082.safetensors",
"transformer.h.31.attn.c_attn.weight": "model-00033-of-00082.safetensors",
"transformer.h.31.attn.c_proj.weight": "model-00033-of-00082.safetensors",
"transformer.h.31.ln_1.weight": "model-00032-of-00082.safetensors",
"transformer.h.31.ln_2.weight": "model-00033-of-00082.safetensors",
"transformer.h.31.mlp.c_proj.weight": "model-00033-of-00082.safetensors",
"transformer.h.31.mlp.w1.weight": "model-00033-of-00082.safetensors",
"transformer.h.31.mlp.w2.weight": "model-00033-of-00082.safetensors",
"transformer.h.32.attn.c_attn.bias": "model-00034-of-00082.safetensors",
"transformer.h.32.attn.c_attn.weight": "model-00034-of-00082.safetensors",
"transformer.h.32.attn.c_proj.weight": "model-00034-of-00082.safetensors",
"transformer.h.32.ln_1.weight": "model-00033-of-00082.safetensors",
"transformer.h.32.ln_2.weight": "model-00034-of-00082.safetensors",
"transformer.h.32.mlp.c_proj.weight": "model-00034-of-00082.safetensors",
"transformer.h.32.mlp.w1.weight": "model-00034-of-00082.safetensors",
"transformer.h.32.mlp.w2.weight": "model-00034-of-00082.safetensors",
"transformer.h.33.attn.c_attn.bias": "model-00035-of-00082.safetensors",
"transformer.h.33.attn.c_attn.weight": "model-00035-of-00082.safetensors",
"transformer.h.33.attn.c_proj.weight": "model-00035-of-00082.safetensors",
"transformer.h.33.ln_1.weight": "model-00034-of-00082.safetensors",
"transformer.h.33.ln_2.weight": "model-00035-of-00082.safetensors",
"transformer.h.33.mlp.c_proj.weight": "model-00035-of-00082.safetensors",
"transformer.h.33.mlp.w1.weight": "model-00035-of-00082.safetensors",
"transformer.h.33.mlp.w2.weight": "model-00035-of-00082.safetensors",
"transformer.h.34.attn.c_attn.bias": "model-00036-of-00082.safetensors",
"transformer.h.34.attn.c_attn.weight": "model-00036-of-00082.safetensors",
"transformer.h.34.attn.c_proj.weight": "model-00036-of-00082.safetensors",
"transformer.h.34.ln_1.weight": "model-00035-of-00082.safetensors",
"transformer.h.34.ln_2.weight": "model-00036-of-00082.safetensors",
"transformer.h.34.mlp.c_proj.weight": "model-00036-of-00082.safetensors",
"transformer.h.34.mlp.w1.weight": "model-00036-of-00082.safetensors",
"transformer.h.34.mlp.w2.weight": "model-00036-of-00082.safetensors",
"transformer.h.35.attn.c_attn.bias": "model-00037-of-00082.safetensors",
"transformer.h.35.attn.c_attn.weight": "model-00037-of-00082.safetensors",
"transformer.h.35.attn.c_proj.weight": "model-00037-of-00082.safetensors",
"transformer.h.35.ln_1.weight": "model-00036-of-00082.safetensors",
"transformer.h.35.ln_2.weight": "model-00037-of-00082.safetensors",
"transformer.h.35.mlp.c_proj.weight": "model-00037-of-00082.safetensors",
"transformer.h.35.mlp.w1.weight": "model-00037-of-00082.safetensors",
"transformer.h.35.mlp.w2.weight": "model-00037-of-00082.safetensors",
"transformer.h.36.attn.c_attn.bias": "model-00038-of-00082.safetensors",
"transformer.h.36.attn.c_attn.weight": "model-00038-of-00082.safetensors",
"transformer.h.36.attn.c_proj.weight": "model-00038-of-00082.safetensors",
"transformer.h.36.ln_1.weight": "model-00037-of-00082.safetensors",
"transformer.h.36.ln_2.weight": "model-00038-of-00082.safetensors",
"transformer.h.36.mlp.c_proj.weight": "model-00038-of-00082.safetensors",
"transformer.h.36.mlp.w1.weight": "model-00038-of-00082.safetensors",
"transformer.h.36.mlp.w2.weight": "model-00038-of-00082.safetensors",
"transformer.h.37.attn.c_attn.bias": "model-00039-of-00082.safetensors",
"transformer.h.37.attn.c_attn.weight": "model-00039-of-00082.safetensors",
"transformer.h.37.attn.c_proj.weight": "model-00039-of-00082.safetensors",
"transformer.h.37.ln_1.weight": "model-00038-of-00082.safetensors",
"transformer.h.37.ln_2.weight": "model-00039-of-00082.safetensors",
"transformer.h.37.mlp.c_proj.weight": "model-00039-of-00082.safetensors",
"transformer.h.37.mlp.w1.weight": "model-00039-of-00082.safetensors",
"transformer.h.37.mlp.w2.weight": "model-00039-of-00082.safetensors",
"transformer.h.38.attn.c_attn.bias": "model-00040-of-00082.safetensors",
"transformer.h.38.attn.c_attn.weight": "model-00040-of-00082.safetensors",
"transformer.h.38.attn.c_proj.weight": "model-00040-of-00082.safetensors",
"transformer.h.38.ln_1.weight": "model-00039-of-00082.safetensors",
"transformer.h.38.ln_2.weight": "model-00040-of-00082.safetensors",
"transformer.h.38.mlp.c_proj.weight": "model-00040-of-00082.safetensors",
"transformer.h.38.mlp.w1.weight": "model-00040-of-00082.safetensors",
"transformer.h.38.mlp.w2.weight": "model-00040-of-00082.safetensors",
"transformer.h.39.attn.c_attn.bias": "model-00041-of-00082.safetensors",
"transformer.h.39.attn.c_attn.weight": "model-00041-of-00082.safetensors",
"transformer.h.39.attn.c_proj.weight": "model-00041-of-00082.safetensors",
"transformer.h.39.ln_1.weight": "model-00040-of-00082.safetensors",
"transformer.h.39.ln_2.weight": "model-00041-of-00082.safetensors",
"transformer.h.39.mlp.c_proj.weight": "model-00041-of-00082.safetensors",
"transformer.h.39.mlp.w1.weight": "model-00041-of-00082.safetensors",
"transformer.h.39.mlp.w2.weight": "model-00041-of-00082.safetensors",
"transformer.h.4.attn.c_attn.bias": "model-00006-of-00082.safetensors",
"transformer.h.4.attn.c_attn.weight": "model-00006-of-00082.safetensors",
"transformer.h.4.attn.c_proj.weight": "model-00006-of-00082.safetensors",
"transformer.h.4.ln_1.weight": "model-00005-of-00082.safetensors",
"transformer.h.4.ln_2.weight": "model-00006-of-00082.safetensors",
"transformer.h.4.mlp.c_proj.weight": "model-00006-of-00082.safetensors",
"transformer.h.4.mlp.w1.weight": "model-00006-of-00082.safetensors",
"transformer.h.4.mlp.w2.weight": "model-00006-of-00082.safetensors",
"transformer.h.40.attn.c_attn.bias": "model-00042-of-00082.safetensors",
"transformer.h.40.attn.c_attn.weight": "model-00042-of-00082.safetensors",
"transformer.h.40.attn.c_proj.weight": "model-00042-of-00082.safetensors",
"transformer.h.40.ln_1.weight": "model-00041-of-00082.safetensors",
"transformer.h.40.ln_2.weight": "model-00042-of-00082.safetensors",
"transformer.h.40.mlp.c_proj.weight": "model-00042-of-00082.safetensors",
"transformer.h.40.mlp.w1.weight": "model-00042-of-00082.safetensors",
"transformer.h.40.mlp.w2.weight": "model-00042-of-00082.safetensors",
"transformer.h.41.attn.c_attn.bias": "model-00043-of-00082.safetensors",
"transformer.h.41.attn.c_attn.weight": "model-00043-of-00082.safetensors",
"transformer.h.41.attn.c_proj.weight": "model-00043-of-00082.safetensors",
"transformer.h.41.ln_1.weight": "model-00042-of-00082.safetensors",
"transformer.h.41.ln_2.weight": "model-00043-of-00082.safetensors",
"transformer.h.41.mlp.c_proj.weight": "model-00043-of-00082.safetensors",
"transformer.h.41.mlp.w1.weight": "model-00043-of-00082.safetensors",
"transformer.h.41.mlp.w2.weight": "model-00043-of-00082.safetensors",
"transformer.h.42.attn.c_attn.bias": "model-00044-of-00082.safetensors",
"transformer.h.42.attn.c_attn.weight": "model-00044-of-00082.safetensors",
"transformer.h.42.attn.c_proj.weight": "model-00044-of-00082.safetensors",
"transformer.h.42.ln_1.weight": "model-00043-of-00082.safetensors",
"transformer.h.42.ln_2.weight": "model-00044-of-00082.safetensors",
"transformer.h.42.mlp.c_proj.weight": "model-00044-of-00082.safetensors",
"transformer.h.42.mlp.w1.weight": "model-00044-of-00082.safetensors",
"transformer.h.42.mlp.w2.weight": "model-00044-of-00082.safetensors",
"transformer.h.43.attn.c_attn.bias": "model-00045-of-00082.safetensors",
"transformer.h.43.attn.c_attn.weight": "model-00045-of-00082.safetensors",
"transformer.h.43.attn.c_proj.weight": "model-00045-of-00082.safetensors",
"transformer.h.43.ln_1.weight": "model-00044-of-00082.safetensors",
"transformer.h.43.ln_2.weight": "model-00045-of-00082.safetensors",
"transformer.h.43.mlp.c_proj.weight": "model-00045-of-00082.safetensors",
"transformer.h.43.mlp.w1.weight": "model-00045-of-00082.safetensors",
"transformer.h.43.mlp.w2.weight": "model-00045-of-00082.safetensors",
"transformer.h.44.attn.c_attn.bias": "model-00046-of-00082.safetensors",
"transformer.h.44.attn.c_attn.weight": "model-00046-of-00082.safetensors",
"transformer.h.44.attn.c_proj.weight": "model-00046-of-00082.safetensors",
"transformer.h.44.ln_1.weight": "model-00045-of-00082.safetensors",
"transformer.h.44.ln_2.weight": "model-00046-of-00082.safetensors",
"transformer.h.44.mlp.c_proj.weight": "model-00046-of-00082.safetensors",
"transformer.h.44.mlp.w1.weight": "model-00046-of-00082.safetensors",
"transformer.h.44.mlp.w2.weight": "model-00046-of-00082.safetensors",
"transformer.h.45.attn.c_attn.bias": "model-00047-of-00082.safetensors",
"transformer.h.45.attn.c_attn.weight": "model-00047-of-00082.safetensors",
"transformer.h.45.attn.c_proj.weight": "model-00047-of-00082.safetensors",
"transformer.h.45.ln_1.weight": "model-00046-of-00082.safetensors",
"transformer.h.45.ln_2.weight": "model-00047-of-00082.safetensors",
"transformer.h.45.mlp.c_proj.weight": "model-00047-of-00082.safetensors",
"transformer.h.45.mlp.w1.weight": "model-00047-of-00082.safetensors",
"transformer.h.45.mlp.w2.weight": "model-00047-of-00082.safetensors",
"transformer.h.46.attn.c_attn.bias": "model-00048-of-00082.safetensors",
"transformer.h.46.attn.c_attn.weight": "model-00048-of-00082.safetensors",
"transformer.h.46.attn.c_proj.weight": "model-00048-of-00082.safetensors",
"transformer.h.46.ln_1.weight": "model-00047-of-00082.safetensors",
"transformer.h.46.ln_2.weight": "model-00048-of-00082.safetensors",
"transformer.h.46.mlp.c_proj.weight": "model-00048-of-00082.safetensors",
"transformer.h.46.mlp.w1.weight": "model-00048-of-00082.safetensors",
"transformer.h.46.mlp.w2.weight": "model-00048-of-00082.safetensors",
"transformer.h.47.attn.c_attn.bias": "model-00049-of-00082.safetensors",
"transformer.h.47.attn.c_attn.weight": "model-00049-of-00082.safetensors",
"transformer.h.47.attn.c_proj.weight": "model-00049-of-00082.safetensors",
"transformer.h.47.ln_1.weight": "model-00048-of-00082.safetensors",
"transformer.h.47.ln_2.weight": "model-00049-of-00082.safetensors",
"transformer.h.47.mlp.c_proj.weight": "model-00049-of-00082.safetensors",
"transformer.h.47.mlp.w1.weight": "model-00049-of-00082.safetensors",
"transformer.h.47.mlp.w2.weight": "model-00049-of-00082.safetensors",
"transformer.h.48.attn.c_attn.bias": "model-00050-of-00082.safetensors",
"transformer.h.48.attn.c_attn.weight": "model-00050-of-00082.safetensors",
"transformer.h.48.attn.c_proj.weight": "model-00050-of-00082.safetensors",
"transformer.h.48.ln_1.weight": "model-00049-of-00082.safetensors",
"transformer.h.48.ln_2.weight": "model-00050-of-00082.safetensors",
"transformer.h.48.mlp.c_proj.weight": "model-00050-of-00082.safetensors",
"transformer.h.48.mlp.w1.weight": "model-00050-of-00082.safetensors",
"transformer.h.48.mlp.w2.weight": "model-00050-of-00082.safetensors",
"transformer.h.49.attn.c_attn.bias": "model-00051-of-00082.safetensors",
"transformer.h.49.attn.c_attn.weight": "model-00051-of-00082.safetensors",
"transformer.h.49.attn.c_proj.weight": "model-00051-of-00082.safetensors",
"transformer.h.49.ln_1.weight": "model-00050-of-00082.safetensors",
"transformer.h.49.ln_2.weight": "model-00051-of-00082.safetensors",
"transformer.h.49.mlp.c_proj.weight": "model-00051-of-00082.safetensors",
"transformer.h.49.mlp.w1.weight": "model-00051-of-00082.safetensors",
"transformer.h.49.mlp.w2.weight": "model-00051-of-00082.safetensors",
"transformer.h.5.attn.c_attn.bias": "model-00007-of-00082.safetensors",
"transformer.h.5.attn.c_attn.weight": "model-00007-of-00082.safetensors",
"transformer.h.5.attn.c_proj.weight": "model-00007-of-00082.safetensors",
"transformer.h.5.ln_1.weight": "model-00006-of-00082.safetensors",
"transformer.h.5.ln_2.weight": "model-00007-of-00082.safetensors",
"transformer.h.5.mlp.c_proj.weight": "model-00007-of-00082.safetensors",
"transformer.h.5.mlp.w1.weight": "model-00007-of-00082.safetensors",
"transformer.h.5.mlp.w2.weight": "model-00007-of-00082.safetensors",
"transformer.h.50.attn.c_attn.bias": "model-00052-of-00082.safetensors",
"transformer.h.50.attn.c_attn.weight": "model-00052-of-00082.safetensors",
"transformer.h.50.attn.c_proj.weight": "model-00052-of-00082.safetensors",
"transformer.h.50.ln_1.weight": "model-00051-of-00082.safetensors",
"transformer.h.50.ln_2.weight": "model-00052-of-00082.safetensors",
"transformer.h.50.mlp.c_proj.weight": "model-00052-of-00082.safetensors",
"transformer.h.50.mlp.w1.weight": "model-00052-of-00082.safetensors",
"transformer.h.50.mlp.w2.weight": "model-00052-of-00082.safetensors",
"transformer.h.51.attn.c_attn.bias": "model-00053-of-00082.safetensors",
"transformer.h.51.attn.c_attn.weight": "model-00053-of-00082.safetensors",
"transformer.h.51.attn.c_proj.weight": "model-00053-of-00082.safetensors",
"transformer.h.51.ln_1.weight": "model-00052-of-00082.safetensors",
"transformer.h.51.ln_2.weight": "model-00053-of-00082.safetensors",
"transformer.h.51.mlp.c_proj.weight": "model-00053-of-00082.safetensors",
"transformer.h.51.mlp.w1.weight": "model-00053-of-00082.safetensors",
"transformer.h.51.mlp.w2.weight": "model-00053-of-00082.safetensors",
"transformer.h.52.attn.c_attn.bias": "model-00054-of-00082.safetensors",
"transformer.h.52.attn.c_attn.weight": "model-00054-of-00082.safetensors",
"transformer.h.52.attn.c_proj.weight": "model-00054-of-00082.safetensors",
"transformer.h.52.ln_1.weight": "model-00053-of-00082.safetensors",
"transformer.h.52.ln_2.weight": "model-00054-of-00082.safetensors",
"transformer.h.52.mlp.c_proj.weight": "model-00054-of-00082.safetensors",
"transformer.h.52.mlp.w1.weight": "model-00054-of-00082.safetensors",
"transformer.h.52.mlp.w2.weight": "model-00054-of-00082.safetensors",
"transformer.h.53.attn.c_attn.bias": "model-00055-of-00082.safetensors",
"transformer.h.53.attn.c_attn.weight": "model-00055-of-00082.safetensors",
"transformer.h.53.attn.c_proj.weight": "model-00055-of-00082.safetensors",
"transformer.h.53.ln_1.weight": "model-00054-of-00082.safetensors",
"transformer.h.53.ln_2.weight": "model-00055-of-00082.safetensors",
"transformer.h.53.mlp.c_proj.weight": "model-00055-of-00082.safetensors",
"transformer.h.53.mlp.w1.weight": "model-00055-of-00082.safetensors",
"transformer.h.53.mlp.w2.weight": "model-00055-of-00082.safetensors",
"transformer.h.54.attn.c_attn.bias": "model-00056-of-00082.safetensors",
"transformer.h.54.attn.c_attn.weight": "model-00056-of-00082.safetensors",
"transformer.h.54.attn.c_proj.weight": "model-00056-of-00082.safetensors",
"transformer.h.54.ln_1.weight": "model-00055-of-00082.safetensors",
"transformer.h.54.ln_2.weight": "model-00056-of-00082.safetensors",
"transformer.h.54.mlp.c_proj.weight": "model-00056-of-00082.safetensors",
"transformer.h.54.mlp.w1.weight": "model-00056-of-00082.safetensors",
"transformer.h.54.mlp.w2.weight": "model-00056-of-00082.safetensors",
"transformer.h.55.attn.c_attn.bias": "model-00057-of-00082.safetensors",
"transformer.h.55.attn.c_attn.weight": "model-00057-of-00082.safetensors",
"transformer.h.55.attn.c_proj.weight": "model-00057-of-00082.safetensors",
"transformer.h.55.ln_1.weight": "model-00056-of-00082.safetensors",
"transformer.h.55.ln_2.weight": "model-00057-of-00082.safetensors",
"transformer.h.55.mlp.c_proj.weight": "model-00057-of-00082.safetensors",
"transformer.h.55.mlp.w1.weight": "model-00057-of-00082.safetensors",
"transformer.h.55.mlp.w2.weight": "model-00057-of-00082.safetensors",
"transformer.h.56.attn.c_attn.bias": "model-00058-of-00082.safetensors",
"transformer.h.56.attn.c_attn.weight": "model-00058-of-00082.safetensors",
"transformer.h.56.attn.c_proj.weight": "model-00058-of-00082.safetensors",
"transformer.h.56.ln_1.weight": "model-00057-of-00082.safetensors",
"transformer.h.56.ln_2.weight": "model-00058-of-00082.safetensors",
"transformer.h.56.mlp.c_proj.weight": "model-00058-of-00082.safetensors",
"transformer.h.56.mlp.w1.weight": "model-00058-of-00082.safetensors",
"transformer.h.56.mlp.w2.weight": "model-00058-of-00082.safetensors",
"transformer.h.57.attn.c_attn.bias": "model-00059-of-00082.safetensors",
"transformer.h.57.attn.c_attn.weight": "model-00059-of-00082.safetensors",
"transformer.h.57.attn.c_proj.weight": "model-00059-of-00082.safetensors",
"transformer.h.57.ln_1.weight": "model-00058-of-00082.safetensors",
"transformer.h.57.ln_2.weight": "model-00059-of-00082.safetensors",
"transformer.h.57.mlp.c_proj.weight": "model-00059-of-00082.safetensors",
"transformer.h.57.mlp.w1.weight": "model-00059-of-00082.safetensors",
"transformer.h.57.mlp.w2.weight": "model-00059-of-00082.safetensors",
"transformer.h.58.attn.c_attn.bias": "model-00060-of-00082.safetensors",
"transformer.h.58.attn.c_attn.weight": "model-00060-of-00082.safetensors",
"transformer.h.58.attn.c_proj.weight": "model-00060-of-00082.safetensors",
"transformer.h.58.ln_1.weight": "model-00059-of-00082.safetensors",
"transformer.h.58.ln_2.weight": "model-00060-of-00082.safetensors",
"transformer.h.58.mlp.c_proj.weight": "model-00060-of-00082.safetensors",
"transformer.h.58.mlp.w1.weight": "model-00060-of-00082.safetensors",
"transformer.h.58.mlp.w2.weight": "model-00060-of-00082.safetensors",
"transformer.h.59.attn.c_attn.bias": "model-00061-of-00082.safetensors",
"transformer.h.59.attn.c_attn.weight": "model-00061-of-00082.safetensors",
"transformer.h.59.attn.c_proj.weight": "model-00061-of-00082.safetensors",
"transformer.h.59.ln_1.weight": "model-00060-of-00082.safetensors",
"transformer.h.59.ln_2.weight": "model-00061-of-00082.safetensors",
"transformer.h.59.mlp.c_proj.weight": "model-00061-of-00082.safetensors",
"transformer.h.59.mlp.w1.weight": "model-00061-of-00082.safetensors",
"transformer.h.59.mlp.w2.weight": "model-00061-of-00082.safetensors",
"transformer.h.6.attn.c_attn.bias": "model-00008-of-00082.safetensors",
"transformer.h.6.attn.c_attn.weight": "model-00008-of-00082.safetensors",
"transformer.h.6.attn.c_proj.weight": "model-00008-of-00082.safetensors",
"transformer.h.6.ln_1.weight": "model-00007-of-00082.safetensors",
"transformer.h.6.ln_2.weight": "model-00008-of-00082.safetensors",
"transformer.h.6.mlp.c_proj.weight": "model-00008-of-00082.safetensors",
"transformer.h.6.mlp.w1.weight": "model-00008-of-00082.safetensors",
"transformer.h.6.mlp.w2.weight": "model-00008-of-00082.safetensors",
"transformer.h.60.attn.c_attn.bias": "model-00062-of-00082.safetensors",
"transformer.h.60.attn.c_attn.weight": "model-00062-of-00082.safetensors",
"transformer.h.60.attn.c_proj.weight": "model-00062-of-00082.safetensors",
"transformer.h.60.ln_1.weight": "model-00061-of-00082.safetensors",
"transformer.h.60.ln_2.weight": "model-00062-of-00082.safetensors",
"transformer.h.60.mlp.c_proj.weight": "model-00062-of-00082.safetensors",
"transformer.h.60.mlp.w1.weight": "model-00062-of-00082.safetensors",
"transformer.h.60.mlp.w2.weight": "model-00062-of-00082.safetensors",
"transformer.h.61.attn.c_attn.bias": "model-00063-of-00082.safetensors",
"transformer.h.61.attn.c_attn.weight": "model-00063-of-00082.safetensors",
"transformer.h.61.attn.c_proj.weight": "model-00063-of-00082.safetensors",
"transformer.h.61.ln_1.weight": "model-00062-of-00082.safetensors",
"transformer.h.61.ln_2.weight": "model-00063-of-00082.safetensors",
"transformer.h.61.mlp.c_proj.weight": "model-00063-of-00082.safetensors",
"transformer.h.61.mlp.w1.weight": "model-00063-of-00082.safetensors",
"transformer.h.61.mlp.w2.weight": "model-00063-of-00082.safetensors",
"transformer.h.62.attn.c_attn.bias": "model-00064-of-00082.safetensors",
"transformer.h.62.attn.c_attn.weight": "model-00064-of-00082.safetensors",
"transformer.h.62.attn.c_proj.weight": "model-00064-of-00082.safetensors",
"transformer.h.62.ln_1.weight": "model-00063-of-00082.safetensors",
"transformer.h.62.ln_2.weight": "model-00064-of-00082.safetensors",
"transformer.h.62.mlp.c_proj.weight": "model-00064-of-00082.safetensors",
"transformer.h.62.mlp.w1.weight": "model-00064-of-00082.safetensors",
"transformer.h.62.mlp.w2.weight": "model-00064-of-00082.safetensors",
"transformer.h.63.attn.c_attn.bias": "model-00065-of-00082.safetensors",
"transformer.h.63.attn.c_attn.weight": "model-00065-of-00082.safetensors",
"transformer.h.63.attn.c_proj.weight": "model-00065-of-00082.safetensors",
"transformer.h.63.ln_1.weight": "model-00064-of-00082.safetensors",
"transformer.h.63.ln_2.weight": "model-00065-of-00082.safetensors",
"transformer.h.63.mlp.c_proj.weight": "model-00065-of-00082.safetensors",
"transformer.h.63.mlp.w1.weight": "model-00065-of-00082.safetensors",
"transformer.h.63.mlp.w2.weight": "model-00065-of-00082.safetensors",
"transformer.h.64.attn.c_attn.bias": "model-00066-of-00082.safetensors",
"transformer.h.64.attn.c_attn.weight": "model-00066-of-00082.safetensors",
"transformer.h.64.attn.c_proj.weight": "model-00066-of-00082.safetensors",
"transformer.h.64.ln_1.weight": "model-00065-of-00082.safetensors",
"transformer.h.64.ln_2.weight": "model-00066-of-00082.safetensors",
"transformer.h.64.mlp.c_proj.weight": "model-00066-of-00082.safetensors",
"transformer.h.64.mlp.w1.weight": "model-00066-of-00082.safetensors",
"transformer.h.64.mlp.w2.weight": "model-00066-of-00082.safetensors",
"transformer.h.65.attn.c_attn.bias": "model-00067-of-00082.safetensors",
"transformer.h.65.attn.c_attn.weight": "model-00067-of-00082.safetensors",
"transformer.h.65.attn.c_proj.weight": "model-00067-of-00082.safetensors",
"transformer.h.65.ln_1.weight": "model-00066-of-00082.safetensors",
"transformer.h.65.ln_2.weight": "model-00067-of-00082.safetensors",
"transformer.h.65.mlp.c_proj.weight": "model-00067-of-00082.safetensors",
"transformer.h.65.mlp.w1.weight": "model-00067-of-00082.safetensors",
"transformer.h.65.mlp.w2.weight": "model-00067-of-00082.safetensors",
"transformer.h.66.attn.c_attn.bias": "model-00068-of-00082.safetensors",
"transformer.h.66.attn.c_attn.weight": "model-00068-of-00082.safetensors",
"transformer.h.66.attn.c_proj.weight": "model-00068-of-00082.safetensors",
"transformer.h.66.ln_1.weight": "model-00067-of-00082.safetensors",
"transformer.h.66.ln_2.weight": "model-00068-of-00082.safetensors",
"transformer.h.66.mlp.c_proj.weight": "model-00068-of-00082.safetensors",
"transformer.h.66.mlp.w1.weight": "model-00068-of-00082.safetensors",
"transformer.h.66.mlp.w2.weight": "model-00068-of-00082.safetensors",
"transformer.h.67.attn.c_attn.bias": "model-00069-of-00082.safetensors",
"transformer.h.67.attn.c_attn.weight": "model-00069-of-00082.safetensors",
"transformer.h.67.attn.c_proj.weight": "model-00069-of-00082.safetensors",
"transformer.h.67.ln_1.weight": "model-00068-of-00082.safetensors",
"transformer.h.67.ln_2.weight": "model-00069-of-00082.safetensors",
"transformer.h.67.mlp.c_proj.weight": "model-00069-of-00082.safetensors",
"transformer.h.67.mlp.w1.weight": "model-00069-of-00082.safetensors",
"transformer.h.67.mlp.w2.weight": "model-00069-of-00082.safetensors",
"transformer.h.68.attn.c_attn.bias": "model-00070-of-00082.safetensors",
"transformer.h.68.attn.c_attn.weight": "model-00070-of-00082.safetensors",
"transformer.h.68.attn.c_proj.weight": "model-00070-of-00082.safetensors",
"transformer.h.68.ln_1.weight": "model-00069-of-00082.safetensors",
"transformer.h.68.ln_2.weight": "model-00070-of-00082.safetensors",
"transformer.h.68.mlp.c_proj.weight": "model-00070-of-00082.safetensors",
"transformer.h.68.mlp.w1.weight": "model-00070-of-00082.safetensors",
"transformer.h.68.mlp.w2.weight": "model-00070-of-00082.safetensors",
"transformer.h.69.attn.c_attn.bias": "model-00071-of-00082.safetensors",
"transformer.h.69.attn.c_attn.weight": "model-00071-of-00082.safetensors",
"transformer.h.69.attn.c_proj.weight": "model-00071-of-00082.safetensors",
"transformer.h.69.ln_1.weight": "model-00070-of-00082.safetensors",
"transformer.h.69.ln_2.weight": "model-00071-of-00082.safetensors",
"transformer.h.69.mlp.c_proj.weight": "model-00071-of-00082.safetensors",
"transformer.h.69.mlp.w1.weight": "model-00071-of-00082.safetensors",
"transformer.h.69.mlp.w2.weight": "model-00071-of-00082.safetensors",
"transformer.h.7.attn.c_attn.bias": "model-00009-of-00082.safetensors",
"transformer.h.7.attn.c_attn.weight": "model-00009-of-00082.safetensors",
"transformer.h.7.attn.c_proj.weight": "model-00009-of-00082.safetensors",
"transformer.h.7.ln_1.weight": "model-00008-of-00082.safetensors",
"transformer.h.7.ln_2.weight": "model-00009-of-00082.safetensors",
"transformer.h.7.mlp.c_proj.weight": "model-00009-of-00082.safetensors",
"transformer.h.7.mlp.w1.weight": "model-00009-of-00082.safetensors",
"transformer.h.7.mlp.w2.weight": "model-00009-of-00082.safetensors",
"transformer.h.70.attn.c_attn.bias": "model-00072-of-00082.safetensors",
"transformer.h.70.attn.c_attn.weight": "model-00072-of-00082.safetensors",
"transformer.h.70.attn.c_proj.weight": "model-00072-of-00082.safetensors",
"transformer.h.70.ln_1.weight": "model-00071-of-00082.safetensors",
"transformer.h.70.ln_2.weight": "model-00072-of-00082.safetensors",
"transformer.h.70.mlp.c_proj.weight": "model-00072-of-00082.safetensors",
"transformer.h.70.mlp.w1.weight": "model-00072-of-00082.safetensors",
"transformer.h.70.mlp.w2.weight": "model-00072-of-00082.safetensors",
"transformer.h.71.attn.c_attn.bias": "model-00073-of-00082.safetensors",
"transformer.h.71.attn.c_attn.weight": "model-00073-of-00082.safetensors",
"transformer.h.71.attn.c_proj.weight": "model-00073-of-00082.safetensors",
"transformer.h.71.ln_1.weight": "model-00072-of-00082.safetensors",
"transformer.h.71.ln_2.weight": "model-00073-of-00082.safetensors",
"transformer.h.71.mlp.c_proj.weight": "model-00073-of-00082.safetensors",
"transformer.h.71.mlp.w1.weight": "model-00073-of-00082.safetensors",
"transformer.h.71.mlp.w2.weight": "model-00073-of-00082.safetensors",
"transformer.h.72.attn.c_attn.bias": "model-00074-of-00082.safetensors",
"transformer.h.72.attn.c_attn.weight": "model-00074-of-00082.safetensors",
"transformer.h.72.attn.c_proj.weight": "model-00074-of-00082.safetensors",
"transformer.h.72.ln_1.weight": "model-00073-of-00082.safetensors",
"transformer.h.72.ln_2.weight": "model-00074-of-00082.safetensors",
"transformer.h.72.mlp.c_proj.weight": "model-00074-of-00082.safetensors",
"transformer.h.72.mlp.w1.weight": "model-00074-of-00082.safetensors",
"transformer.h.72.mlp.w2.weight": "model-00074-of-00082.safetensors",
"transformer.h.73.attn.c_attn.bias": "model-00075-of-00082.safetensors",
"transformer.h.73.attn.c_attn.weight": "model-00075-of-00082.safetensors",
"transformer.h.73.attn.c_proj.weight": "model-00075-of-00082.safetensors",
"transformer.h.73.ln_1.weight": "model-00074-of-00082.safetensors",
"transformer.h.73.ln_2.weight": "model-00075-of-00082.safetensors",
"transformer.h.73.mlp.c_proj.weight": "model-00075-of-00082.safetensors",
"transformer.h.73.mlp.w1.weight": "model-00075-of-00082.safetensors",
"transformer.h.73.mlp.w2.weight": "model-00075-of-00082.safetensors",
"transformer.h.74.attn.c_attn.bias": "model-00076-of-00082.safetensors",
"transformer.h.74.attn.c_attn.weight": "model-00076-of-00082.safetensors",
"transformer.h.74.attn.c_proj.weight": "model-00076-of-00082.safetensors",
"transformer.h.74.ln_1.weight": "model-00075-of-00082.safetensors",
"transformer.h.74.ln_2.weight": "model-00076-of-00082.safetensors",
"transformer.h.74.mlp.c_proj.weight": "model-00076-of-00082.safetensors",
"transformer.h.74.mlp.w1.weight": "model-00076-of-00082.safetensors",
"transformer.h.74.mlp.w2.weight": "model-00076-of-00082.safetensors",
"transformer.h.75.attn.c_attn.bias": "model-00077-of-00082.safetensors",
"transformer.h.75.attn.c_attn.weight": "model-00077-of-00082.safetensors",
"transformer.h.75.attn.c_proj.weight": "model-00077-of-00082.safetensors",
"transformer.h.75.ln_1.weight": "model-00076-of-00082.safetensors",
"transformer.h.75.ln_2.weight": "model-00077-of-00082.safetensors",
"transformer.h.75.mlp.c_proj.weight": "model-00077-of-00082.safetensors",
"transformer.h.75.mlp.w1.weight": "model-00077-of-00082.safetensors",
"transformer.h.75.mlp.w2.weight": "model-00077-of-00082.safetensors",
"transformer.h.76.attn.c_attn.bias": "model-00078-of-00082.safetensors",
"transformer.h.76.attn.c_attn.weight": "model-00078-of-00082.safetensors",
"transformer.h.76.attn.c_proj.weight": "model-00078-of-00082.safetensors",
"transformer.h.76.ln_1.weight": "model-00077-of-00082.safetensors",
"transformer.h.76.ln_2.weight": "model-00078-of-00082.safetensors",
"transformer.h.76.mlp.c_proj.weight": "model-00078-of-00082.safetensors",
"transformer.h.76.mlp.w1.weight": "model-00078-of-00082.safetensors",
"transformer.h.76.mlp.w2.weight": "model-00078-of-00082.safetensors",
"transformer.h.77.attn.c_attn.bias": "model-00079-of-00082.safetensors",
"transformer.h.77.attn.c_attn.weight": "model-00079-of-00082.safetensors",
"transformer.h.77.attn.c_proj.weight": "model-00079-of-00082.safetensors",
"transformer.h.77.ln_1.weight": "model-00078-of-00082.safetensors",
"transformer.h.77.ln_2.weight": "model-00079-of-00082.safetensors",
"transformer.h.77.mlp.c_proj.weight": "model-00079-of-00082.safetensors",
"transformer.h.77.mlp.w1.weight": "model-00079-of-00082.safetensors",
"transformer.h.77.mlp.w2.weight": "model-00079-of-00082.safetensors",
"transformer.h.78.attn.c_attn.bias": "model-00080-of-00082.safetensors",
"transformer.h.78.attn.c_attn.weight": "model-00080-of-00082.safetensors",
"transformer.h.78.attn.c_proj.weight": "model-00080-of-00082.safetensors",
"transformer.h.78.ln_1.weight": "model-00079-of-00082.safetensors",
"transformer.h.78.ln_2.weight": "model-00080-of-00082.safetensors",
"transformer.h.78.mlp.c_proj.weight": "model-00080-of-00082.safetensors",
"transformer.h.78.mlp.w1.weight": "model-00080-of-00082.safetensors",
"transformer.h.78.mlp.w2.weight": "model-00080-of-00082.safetensors",
"transformer.h.79.attn.c_attn.bias": "model-00081-of-00082.safetensors",
"transformer.h.79.attn.c_attn.weight": "model-00081-of-00082.safetensors",
"transformer.h.79.attn.c_proj.weight": "model-00081-of-00082.safetensors",
"transformer.h.79.ln_1.weight": "model-00080-of-00082.safetensors",
"transformer.h.79.ln_2.weight": "model-00081-of-00082.safetensors",
"transformer.h.79.mlp.c_proj.weight": "model-00081-of-00082.safetensors",
"transformer.h.79.mlp.w1.weight": "model-00081-of-00082.safetensors",
"transformer.h.79.mlp.w2.weight": "model-00081-of-00082.safetensors",
"transformer.h.8.attn.c_attn.bias": "model-00010-of-00082.safetensors",
"transformer.h.8.attn.c_attn.weight": "model-00010-of-00082.safetensors",
"transformer.h.8.attn.c_proj.weight": "model-00010-of-00082.safetensors",
"transformer.h.8.ln_1.weight": "model-00009-of-00082.safetensors",
"transformer.h.8.ln_2.weight": "model-00010-of-00082.safetensors",
"transformer.h.8.mlp.c_proj.weight": "model-00010-of-00082.safetensors",
"transformer.h.8.mlp.w1.weight": "model-00010-of-00082.safetensors",
"transformer.h.8.mlp.w2.weight": "model-00010-of-00082.safetensors",
"transformer.h.9.attn.c_attn.bias": "model-00011-of-00082.safetensors",
"transformer.h.9.attn.c_attn.weight": "model-00011-of-00082.safetensors",
"transformer.h.9.attn.c_proj.weight": "model-00011-of-00082.safetensors",
"transformer.h.9.ln_1.weight": "model-00010-of-00082.safetensors",
"transformer.h.9.ln_2.weight": "model-00011-of-00082.safetensors",
"transformer.h.9.mlp.c_proj.weight": "model-00011-of-00082.safetensors",
"transformer.h.9.mlp.w1.weight": "model-00011-of-00082.safetensors",
"transformer.h.9.mlp.w2.weight": "model-00011-of-00082.safetensors",
"transformer.ln_f.weight": "model-00081-of-00082.safetensors",
"transformer.wte.weight": "model-00001-of-00082.safetensors"
}
}
1
https://gitee.com/hf-models/Qwen-72B-Chat.git
git@gitee.com:hf-models/Qwen-72B-Chat.git
hf-models
Qwen-72B-Chat
Qwen-72B-Chat
main

搜索帮助

53164aa7 5694891 3bd8fe86 5694891