Darok commited on
Commit
04d7ff3
·
verified ·
1 Parent(s): 4b9e141

Upload 6 files

Browse files
README.md CHANGED
@@ -1,3 +1 @@
1
- ---
2
- license: apache-2.0
3
- ---
 
1
+ # converted rwkv6
 
 
model-00001-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce617ceff375af51269a72971d23869664a73329bef9bc27749c07a496619bcd
3
+ size 4248394184
model-00002-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddf2a1f2d89d0de84b64c0ff2ee66f7ab140713a594a3868e5da8aba4098cebe
3
+ size 4211089912
model-00003-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca8593fd4bbb2ad6a23eecd771d6f7d774671a4ff8dc488b3c78c112be3eb8a8
3
+ size 4294975960
model-00004-of-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55545393a2c1eafaaef91bd406b4edaac6da9a9fb33ff4376653005ebadc546e
3
+ size 2281703872
model.safetensors.index.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"metadata": {"total_size": 15036088320}, "weight_map": {"model.blocks.0.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.0.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.0.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.0.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.0.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.0.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.0.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.0.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.0.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.0.ln0.bias": "model-00001-of-00004.safetensors", "model.blocks.0.ln0.weight": "model-00001-of-00004.safetensors", "model.blocks.0.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.0.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.0.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.0.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.1.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.1.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.1.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.1.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.1.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.1.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.1.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.1.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.1.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.1.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.1.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.1.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.1.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.10.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.10.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.10.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.10.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.10.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.10.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.10.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.10.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.10.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.10.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.10.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.10.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.10.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.11.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.11.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.11.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.11.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.11.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.11.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.11.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.11.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.11.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.11.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.11.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.11.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.11.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.12.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.12.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.12.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.12.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.12.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.12.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.12.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.12.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.12.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.12.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.12.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.12.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.12.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.13.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.13.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.13.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.13.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.13.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.13.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.13.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.13.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.13.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.13.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.13.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.13.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.13.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.14.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.14.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.14.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.14.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.14.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.14.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.14.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.14.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.14.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.14.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.14.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.14.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.14.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.15.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.15.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.15.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.15.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.15.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.15.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.15.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.15.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.15.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.15.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.15.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.15.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.15.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.16.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.16.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.16.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.16.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.16.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.16.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.16.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.16.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.16.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.16.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.16.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.16.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.16.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.17.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.17.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.17.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.17.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.17.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.17.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.17.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.17.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.17.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.17.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.17.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.17.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.17.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.18.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.18.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.18.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.18.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.18.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.18.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.18.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.18.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.18.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.18.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.18.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.18.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.18.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.19.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.19.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.19.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.19.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.19.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.19.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.19.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.19.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.19.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.19.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.19.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.19.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.19.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.2.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.2.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.2.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.2.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.2.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.2.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.2.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.2.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.2.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.2.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.2.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.2.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.2.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.20.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.20.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.20.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.20.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.20.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.20.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.20.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.20.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.20.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.20.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.20.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.20.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.20.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.21.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.21.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.21.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.21.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.21.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.21.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.21.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.21.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.21.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.21.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.21.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.21.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.21.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.22.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.22.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.22.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.22.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.22.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.22.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.22.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.22.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.22.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.22.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.22.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.22.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.22.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.23.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.23.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.23.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.23.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.23.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.23.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.23.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.23.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.23.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.23.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.23.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.23.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.23.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.24.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.24.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.24.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.24.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.24.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.24.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.24.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.24.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.24.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.24.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.24.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.24.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.24.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.25.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.25.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.25.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.25.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.25.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.25.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.25.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.25.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.25.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.25.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.25.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.25.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.25.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.26.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.26.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.26.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.26.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.26.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.26.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.26.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.26.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.26.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.26.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.26.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.26.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.26.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.27.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.27.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.27.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.27.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.27.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.27.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.27.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.27.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.27.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.27.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.27.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.27.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.27.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.28.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.28.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.28.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.28.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.28.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.28.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.28.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.28.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.28.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.28.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.28.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.28.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.28.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.29.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.29.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.29.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.29.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.29.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.29.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.29.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.29.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.29.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.29.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.29.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.29.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.29.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.3.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.3.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.3.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.3.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.3.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.3.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.3.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.3.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.3.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.3.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.3.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.3.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.3.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.30.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.30.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.30.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.30.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.30.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.30.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.30.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.30.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.30.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.30.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.30.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.30.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.30.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.31.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.31.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.31.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.31.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.31.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.31.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.31.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.31.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.31.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.31.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.31.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.31.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.31.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.4.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.4.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.4.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.4.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.4.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.4.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.4.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.4.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.4.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.4.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.4.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.4.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.4.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.5.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.5.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.5.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.5.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.5.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.5.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.5.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.5.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.5.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.5.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.5.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.5.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.5.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.6.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.6.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.6.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.6.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.6.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.6.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.6.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.6.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.6.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.6.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.6.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.6.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.6.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.7.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.7.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.7.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.7.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.7.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.7.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.7.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.7.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.7.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.7.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.7.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.7.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.7.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.8.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.8.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.8.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.8.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.8.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.8.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.8.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.8.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.8.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.8.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.8.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.8.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.8.ln2.weight": "model-00001-of-00004.safetensors", "model.blocks.9.att.ln_x.bias": "model-00001-of-00004.safetensors", "model.blocks.9.att.ln_x.weight": "model-00001-of-00004.safetensors", "model.blocks.9.att.time_faaaa": "model-00001-of-00004.safetensors", "model.blocks.9.att.time_mix_g": "model-00001-of-00004.safetensors", "model.blocks.9.att.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.9.att.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.9.att.time_mix_v": "model-00001-of-00004.safetensors", "model.blocks.9.ffn.time_mix_k": "model-00001-of-00004.safetensors", "model.blocks.9.ffn.time_mix_r": "model-00001-of-00004.safetensors", "model.blocks.9.ln1.bias": "model-00001-of-00004.safetensors", "model.blocks.9.ln1.weight": "model-00001-of-00004.safetensors", "model.blocks.9.ln2.bias": "model-00001-of-00004.safetensors", "model.blocks.9.ln2.weight": "model-00001-of-00004.safetensors", "model.ln_out.bias": "model-00001-of-00004.safetensors", "model.ln_out.weight": "model-00001-of-00004.safetensors", "model.blocks.0.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.1.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.10.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.11.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.12.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.13.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.14.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.15.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.16.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.17.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.18.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.19.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.2.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.20.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.21.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.22.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.23.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.24.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.25.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.26.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.27.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.28.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.29.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.3.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.30.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.31.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.4.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.5.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.6.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.7.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.8.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.9.att.time_decay": "model-00001-of-00004.safetensors", "model.blocks.0.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.0.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.0.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.0.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.0.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.0.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.0.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.0.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.1.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.1.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.1.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.1.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.1.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.1.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.1.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.1.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.10.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.10.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.10.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.10.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.10.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.10.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.10.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.10.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.11.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.11.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.11.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.11.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.11.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.11.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.11.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.11.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.12.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.12.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.12.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.12.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.12.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.12.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.12.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.12.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.13.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.13.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.13.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.13.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.13.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.13.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.13.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.13.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.14.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.14.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.14.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.14.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.14.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.14.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.14.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.14.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.15.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.15.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.15.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.15.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.15.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.15.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.15.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.15.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.16.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.16.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.16.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.16.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.16.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.16.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.16.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.16.ffn.value.weight": "model-00001-of-00004.safetensors", "model.blocks.17.att.gate.weight": "model-00001-of-00004.safetensors", "model.blocks.17.att.key.weight": "model-00001-of-00004.safetensors", "model.blocks.17.att.output.weight": "model-00001-of-00004.safetensors", "model.blocks.17.att.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.17.att.value.weight": "model-00001-of-00004.safetensors", "model.blocks.17.ffn.key.weight": "model-00001-of-00004.safetensors", "model.blocks.17.ffn.receptance.weight": "model-00001-of-00004.safetensors", "model.blocks.17.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.18.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.18.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.18.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.18.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.18.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.18.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.18.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.18.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.19.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.19.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.19.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.19.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.19.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.19.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.19.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.19.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.2.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.2.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.2.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.2.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.2.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.2.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.2.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.2.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.20.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.20.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.20.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.20.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.20.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.20.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.20.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.20.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.21.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.21.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.21.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.21.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.21.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.21.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.21.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.21.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.22.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.22.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.22.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.22.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.22.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.22.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.22.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.22.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.23.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.23.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.23.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.23.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.23.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.23.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.23.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.23.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.24.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.24.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.24.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.24.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.24.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.24.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.24.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.24.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.25.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.25.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.25.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.25.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.25.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.25.ffn.key.weight": "model-00002-of-00004.safetensors", "model.blocks.25.ffn.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.25.ffn.value.weight": "model-00002-of-00004.safetensors", "model.blocks.26.att.gate.weight": "model-00002-of-00004.safetensors", "model.blocks.26.att.key.weight": "model-00002-of-00004.safetensors", "model.blocks.26.att.output.weight": "model-00002-of-00004.safetensors", "model.blocks.26.att.receptance.weight": "model-00002-of-00004.safetensors", "model.blocks.26.att.value.weight": "model-00002-of-00004.safetensors", "model.blocks.26.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.26.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.26.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.27.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.27.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.27.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.27.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.27.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.27.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.27.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.27.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.28.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.28.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.28.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.28.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.28.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.28.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.28.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.28.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.29.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.29.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.29.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.29.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.29.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.29.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.29.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.29.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.3.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.3.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.3.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.3.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.3.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.3.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.3.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.3.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.30.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.30.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.30.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.30.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.30.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.30.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.30.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.30.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.31.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.31.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.31.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.31.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.31.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.31.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.31.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.31.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.4.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.4.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.4.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.4.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.4.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.4.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.4.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.4.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.5.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.5.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.5.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.5.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.5.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.5.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.5.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.5.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.6.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.6.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.6.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.6.att.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.6.att.value.weight": "model-00003-of-00004.safetensors", "model.blocks.6.ffn.key.weight": "model-00003-of-00004.safetensors", "model.blocks.6.ffn.receptance.weight": "model-00003-of-00004.safetensors", "model.blocks.6.ffn.value.weight": "model-00003-of-00004.safetensors", "model.blocks.7.att.gate.weight": "model-00003-of-00004.safetensors", "model.blocks.7.att.key.weight": "model-00003-of-00004.safetensors", "model.blocks.7.att.output.weight": "model-00003-of-00004.safetensors", "model.blocks.7.att.receptance.weight": "model-00004-of-00004.safetensors", "model.blocks.7.att.value.weight": "model-00004-of-00004.safetensors", "model.blocks.7.ffn.key.weight": "model-00004-of-00004.safetensors", "model.blocks.7.ffn.receptance.weight": "model-00004-of-00004.safetensors", "model.blocks.7.ffn.value.weight": "model-00004-of-00004.safetensors", "model.blocks.8.att.gate.weight": "model-00004-of-00004.safetensors", "model.blocks.8.att.key.weight": "model-00004-of-00004.safetensors", "model.blocks.8.att.output.weight": "model-00004-of-00004.safetensors", "model.blocks.8.att.receptance.weight": "model-00004-of-00004.safetensors", "model.blocks.8.att.value.weight": "model-00004-of-00004.safetensors", "model.blocks.8.ffn.key.weight": "model-00004-of-00004.safetensors", "model.blocks.8.ffn.receptance.weight": "model-00004-of-00004.safetensors", "model.blocks.8.ffn.value.weight": "model-00004-of-00004.safetensors", "model.blocks.9.att.gate.weight": "model-00004-of-00004.safetensors", "model.blocks.9.att.key.weight": "model-00004-of-00004.safetensors", "model.blocks.9.att.output.weight": "model-00004-of-00004.safetensors", "model.blocks.9.att.receptance.weight": "model-00004-of-00004.safetensors", "model.blocks.9.att.value.weight": "model-00004-of-00004.safetensors", "model.blocks.9.ffn.key.weight": "model-00004-of-00004.safetensors", "model.blocks.9.ffn.receptance.weight": "model-00004-of-00004.safetensors", "model.blocks.9.ffn.value.weight": "model-00004-of-00004.safetensors", "model.emb.weight": "model-00004-of-00004.safetensors", "model.head.weight": "model-00004-of-00004.safetensors"}}