mgoin committed on
Commit
5d13b1c
·
verified ·
1 Parent(s): d16c998

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because the commit contains too many changes. See raw diff
Files changed (50) hide show
  1. added_tokens.json +4 -0
  2. config.json +81 -0
  3. generation_config.json +8 -0
  4. merges.txt +0 -0
  5. model-00001-of-00061.safetensors +3 -0
  6. model-00002-of-00061.safetensors +3 -0
  7. model-00003-of-00061.safetensors +3 -0
  8. model-00004-of-00061.safetensors +3 -0
  9. model-00005-of-00061.safetensors +3 -0
  10. model-00006-of-00061.safetensors +3 -0
  11. model-00007-of-00061.safetensors +3 -0
  12. model-00008-of-00061.safetensors +3 -0
  13. model-00009-of-00061.safetensors +3 -0
  14. model-00010-of-00061.safetensors +3 -0
  15. model-00011-of-00061.safetensors +3 -0
  16. model-00012-of-00061.safetensors +3 -0
  17. model-00013-of-00061.safetensors +3 -0
  18. model-00014-of-00061.safetensors +3 -0
  19. model-00015-of-00061.safetensors +3 -0
  20. model-00016-of-00061.safetensors +3 -0
  21. model-00017-of-00061.safetensors +3 -0
  22. model-00018-of-00061.safetensors +3 -0
  23. model-00019-of-00061.safetensors +3 -0
  24. model-00020-of-00061.safetensors +3 -0
  25. model-00021-of-00061.safetensors +3 -0
  26. model-00022-of-00061.safetensors +3 -0
  27. model-00023-of-00061.safetensors +3 -0
  28. model-00024-of-00061.safetensors +3 -0
  29. model-00025-of-00061.safetensors +3 -0
  30. model-00026-of-00061.safetensors +3 -0
  31. model-00027-of-00061.safetensors +3 -0
  32. model-00028-of-00061.safetensors +3 -0
  33. model-00029-of-00061.safetensors +3 -0
  34. model-00030-of-00061.safetensors +3 -0
  35. model-00031-of-00061.safetensors +3 -0
  36. model-00032-of-00061.safetensors +3 -0
  37. model-00033-of-00061.safetensors +3 -0
  38. model-00034-of-00061.safetensors +3 -0
  39. model-00035-of-00061.safetensors +3 -0
  40. model-00036-of-00061.safetensors +3 -0
  41. model-00037-of-00061.safetensors +3 -0
  42. model-00038-of-00061.safetensors +3 -0
  43. model-00039-of-00061.safetensors +3 -0
  44. model-00040-of-00061.safetensors +3 -0
  45. model-00041-of-00061.safetensors +3 -0
  46. model-00042-of-00061.safetensors +3 -0
  47. model-00043-of-00061.safetensors +3 -0
  48. model-00044-of-00061.safetensors +3 -0
  49. model-00045-of-00061.safetensors +3 -0
  50. model-00046-of-00061.safetensors +3 -0
added_tokens.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "<|im_end|>": 100279,
3
+ "<|im_start|>": 100278
4
+ }
config.json ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "databricks/dbrx-instruct",
3
+ "architectures": [
4
+ "DbrxForCausalLM"
5
+ ],
6
+ "attn_config": {
7
+ "clip_qkv": 8,
8
+ "kv_n_heads": 8,
9
+ "model_type": "",
10
+ "rope_theta": 500000
11
+ },
12
+ "d_model": 6144,
13
+ "emb_pdrop": 0.0,
14
+ "ffn_config": {
15
+ "ffn_hidden_size": 10752,
16
+ "model_type": "",
17
+ "moe_jitter_eps": 0,
18
+ "moe_loss_weight": 0.05,
19
+ "moe_num_experts": 16,
20
+ "moe_top_k": 4
21
+ },
22
+ "initializer_range": 0.02,
23
+ "max_seq_len": 32768,
24
+ "model_type": "dbrx",
25
+ "n_heads": 48,
26
+ "n_layers": 40,
27
+ "output_router_logits": false,
28
+ "quantization_config": {
29
+ "activation_scheme": "static",
30
+ "ignored_layers": [
31
+ "transformer.blocks.26.ffn.router.layer",
32
+ "transformer.blocks.1.ffn.router.layer",
33
+ "transformer.blocks.32.ffn.router.layer",
34
+ "transformer.blocks.35.ffn.router.layer",
35
+ "transformer.blocks.16.ffn.router.layer",
36
+ "transformer.blocks.15.ffn.router.layer",
37
+ "transformer.blocks.10.ffn.router.layer",
38
+ "transformer.blocks.18.ffn.router.layer",
39
+ "transformer.blocks.34.ffn.router.layer",
40
+ "transformer.blocks.38.ffn.router.layer",
41
+ "transformer.blocks.13.ffn.router.layer",
42
+ "transformer.blocks.29.ffn.router.layer",
43
+ "transformer.blocks.3.ffn.router.layer",
44
+ "transformer.blocks.33.ffn.router.layer",
45
+ "transformer.blocks.21.ffn.router.layer",
46
+ "transformer.blocks.19.ffn.router.layer",
47
+ "transformer.blocks.8.ffn.router.layer",
48
+ "transformer.blocks.0.ffn.router.layer",
49
+ "transformer.blocks.37.ffn.router.layer",
50
+ "transformer.blocks.39.ffn.router.layer",
51
+ "transformer.blocks.4.ffn.router.layer",
52
+ "transformer.blocks.28.ffn.router.layer",
53
+ "transformer.blocks.7.ffn.router.layer",
54
+ "transformer.blocks.5.ffn.router.layer",
55
+ "transformer.blocks.9.ffn.router.layer",
56
+ "transformer.blocks.24.ffn.router.layer",
57
+ "transformer.blocks.25.ffn.router.layer",
58
+ "transformer.blocks.20.ffn.router.layer",
59
+ "transformer.blocks.27.ffn.router.layer",
60
+ "transformer.blocks.2.ffn.router.layer",
61
+ "transformer.blocks.31.ffn.router.layer",
62
+ "transformer.blocks.6.ffn.router.layer",
63
+ "transformer.blocks.30.ffn.router.layer",
64
+ "transformer.blocks.36.ffn.router.layer",
65
+ "transformer.blocks.12.ffn.router.layer",
66
+ "transformer.blocks.14.ffn.router.layer",
67
+ "transformer.blocks.23.ffn.router.layer",
68
+ "transformer.blocks.22.ffn.router.layer",
69
+ "transformer.blocks.11.ffn.router.layer",
70
+ "lm_head",
71
+ "transformer.blocks.17.ffn.router.layer"
72
+ ],
73
+ "quant_method": "fp8"
74
+ },
75
+ "resid_pdrop": 0.0,
76
+ "tie_word_embeddings": false,
77
+ "torch_dtype": "bfloat16",
78
+ "transformers_version": "4.42.1",
79
+ "use_cache": true,
80
+ "vocab_size": 100352
81
+ }
generation_config.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "eos_token_id": [
4
+ 100257,
5
+ 100279
6
+ ],
7
+ "transformers_version": "4.42.1"
8
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e8b15b783711ec62909b64fd67b83ecef4de9b6be4893f6af0c46f0c46b0ec9
3
+ size 3435357520
model-00002-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7464f3cf2dca00899cbb3314e8d17b9a122d265f745472218878c5c4353e6d6f
3
+ size 4316161376
model-00003-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eaf9bdd6896edda1c662ac7530a4053220d4a49da0c0361e90d8b7855141f251
3
+ size 4227858704
model-00004-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31378090076d6aedb0d26fb257b3b18cb602dcbc0f727a2af48c34f8423fe7b8
3
+ size 4316161376
model-00005-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d52f5d01e62b1ff7f0639793ae82c521da62e335e7f5c5b02ef9f8352d8f3ab
3
+ size 4316161376
model-00006-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d06f6f69cc365df30371efea4514bca2bfc8a25ff31064d21e90995733f956b
3
+ size 4227858704
model-00007-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e251a1e5b0ae39108d718009179e63fb0a47bd6aeb498e6886d630d2143d1eb
3
+ size 4316161376
model-00008-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c0f576c57592f9bb52cc3e6e8918551e07a86cadd0c84d65686ab1bf40d3e26
3
+ size 4316161376
model-00009-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47f5395b27077df7f4bcc94ec9dbf870e8fd0bdef35764e10e43017dcc13424f
3
+ size 4227858704
model-00010-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10cbdafcb67e0f147a1f2c0f1ff1e6620ad3c9bc6ae83d8ab0ff0982c21a2128
3
+ size 4316161376
model-00011-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d212ec0a27345212b43e1480b9d7eade80636ffbe8b9cbba8ea5a782353f044
3
+ size 4316161376
model-00012-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1e0086fafd04d58ea6a61b7e7660f6bbe54a0380a6fa1f39464ac8be440e7d8
3
+ size 4227858704
model-00013-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cec7de4e706f5bbc2761f8cc1b265cda119c2ab940bca30fe763807eef50c36d
3
+ size 4316161376
model-00014-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d935f89152887adfc8bf5f706028cfc64739a739327edad794fcf01c30e597c2
3
+ size 4316161376
model-00015-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7d1cb9080dbf19ec925aff6beba736866ae505e334d5e852183468dc57188d0
3
+ size 4227858704
model-00016-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cadd10a61433dee6427a0009399d38bd0416cab796d0eca7d6285973308c46db
3
+ size 4316161384
model-00017-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69b9f9e0d3cb3989eaffe295bc9f3559a8168e9846823408ca9fedf8c19c20c8
3
+ size 4316161384
model-00018-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24f9e0a148c17ae3fef677ae94a8290a562bd6a31a805e76e23f91c2dbbd9f18
3
+ size 4227858712
model-00019-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d88c2076722a42c9261b14a7ef8f6e08737bba73f85ef9ba53c5f91c37c03979
3
+ size 4316161384
model-00020-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72f7c767a98973251919e6bdeef15c3ee2f16d0767c29caba485ab36d8024501
3
+ size 4316161384
model-00021-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af7b81ca660ca1afde8b1a0f697724a788e7566214e7178492d0839e441819a4
3
+ size 4227858712
model-00022-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30039fdc47d1c16b7aa1054183641a825121b6ad67a2c469d31f780f82068201
3
+ size 4316161384
model-00023-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec8716637d14e23712eb218f5758bd7eceb94cfeb5b2dd3235ababe2eb528fe7
3
+ size 4316161384
model-00024-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02350eeaa1d595bf65fc5c16c9ee3241f195fa0118d9dc9f983374b145bf35ea
3
+ size 4227858712
model-00025-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:104339642f4cee4f0ec67a8742bdba5462e64d9fa046dbf1fea5124711b7c04f
3
+ size 4316161384
model-00026-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df93e04202bbb3cb179b493a8f7c240e44291bb800dc9426f9b75584469e6be0
3
+ size 4316161384
model-00027-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1db31da422deb6f7098c79dd18a3fab823fe8d6ae95dfcd751e7bc7fa1650def
3
+ size 4227858712
model-00028-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d19a879b30c1d146498c9559d83914deaed40d7f62acda21b1a437bcc96e2f88
3
+ size 4316161384
model-00029-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0bf8905712028a61a7c8d9fe8bb8ed4520a605b0e3a417286ec59a8d6bac219
3
+ size 4316161384
model-00030-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:573a4ef61f3d9f1974f05612cc0299475c41f6a8d4e1ae530a0f21e8e6b04725
3
+ size 4227858712
model-00031-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0c8d508ca682e3acd5df26816dbb4de4210ccb7ca767339aa2dfcf39fdd232f
3
+ size 4316161384
model-00032-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc4b706d1273e6a1eb841c9fce993e9f9eb6b1b3a2c473f3174d4d8ca8c7f7e5
3
+ size 4316161384
model-00033-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d410b47d48eb572478b80a6ea1766da7ef7b5fdbb8e9e4e611208b2677cb81bd
3
+ size 4227858712
model-00034-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb31f0569a18273ee5701886f35cd14a924d1f3eb08504d755b957e9b4a29091
3
+ size 4316161384
model-00035-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0626e5e1c5ecd91c1209d5f13b8cbe76646a7601d5c9a02464fae5e080188ba5
3
+ size 4316161384
model-00036-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc2d28e62edf58cf121924c4a57c172021a9dbe972d75cfdeb54180a1f21957b
3
+ size 4227858712
model-00037-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6c8ae00611706f2a58ee27c07197ee8c38ac23e9e37b1900ae9d2824dde6a1b
3
+ size 4316161384
model-00038-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f5df07bff32f527bdf879578ed3efa1781ca64e05245f679c6cf8c70ade8937
3
+ size 4316161384
model-00039-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d6b612cb8b81dc0714c0f7db73e0e9b4e14eb463e7069b16f5387bd2673890a
3
+ size 4227858712
model-00040-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faeb5d54f25873f04fcdd2359ce98b90ef9622af4b7fc56308c32b8253b7e9ed
3
+ size 4316161384
model-00041-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30a2a7f1c902a90c1eb9bece8eec7fd42793a96017dac7e2a923369375a5421c
3
+ size 4316161384
model-00042-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:128e0433397f8e992cd174ea9b2931af49e25feeb78aef9c6cd5335da6e86e82
3
+ size 4227858712
model-00043-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f9afb67300bfdfff496ddb766fcb454b497b7e83920f45eb2fbd4c2ea83b8f6
3
+ size 4316161384
model-00044-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f0488d9b6d8dbf69572a28fb997bc5b63b7d35dc2797d79b3a1968e3e426cac
3
+ size 4316161384
model-00045-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f8796101e5df9c327e6bcc376ffaba33191270a966be67cfa9d75ef1dbac695
3
+ size 4227858712
model-00046-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:baeb4128e8001e0211c8366ba5b2092c5bb17245325e8f580833596abf048615
3
+ size 4316161384