Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +35 -0
- generation_config.json +9 -0
- pytorch_model-00001-of-00191.bin +3 -0
- pytorch_model-00002-of-00191.bin +3 -0
- pytorch_model-00003-of-00191.bin +3 -0
- pytorch_model-00004-of-00191.bin +3 -0
- pytorch_model-00005-of-00191.bin +3 -0
- pytorch_model-00006-of-00191.bin +3 -0
- pytorch_model-00007-of-00191.bin +3 -0
- pytorch_model-00008-of-00191.bin +3 -0
- pytorch_model-00009-of-00191.bin +3 -0
- pytorch_model-00010-of-00191.bin +3 -0
- pytorch_model-00011-of-00191.bin +3 -0
- pytorch_model-00012-of-00191.bin +3 -0
- pytorch_model-00013-of-00191.bin +3 -0
- pytorch_model-00014-of-00191.bin +3 -0
- pytorch_model-00015-of-00191.bin +3 -0
- pytorch_model-00016-of-00191.bin +3 -0
- pytorch_model-00017-of-00191.bin +3 -0
- pytorch_model-00018-of-00191.bin +3 -0
- pytorch_model-00019-of-00191.bin +3 -0
- pytorch_model-00020-of-00191.bin +3 -0
- pytorch_model-00021-of-00191.bin +3 -0
- pytorch_model-00022-of-00191.bin +3 -0
- pytorch_model-00023-of-00191.bin +3 -0
- pytorch_model-00024-of-00191.bin +3 -0
- pytorch_model-00025-of-00191.bin +3 -0
- pytorch_model-00026-of-00191.bin +3 -0
- pytorch_model-00027-of-00191.bin +3 -0
- pytorch_model-00028-of-00191.bin +3 -0
- pytorch_model-00029-of-00191.bin +3 -0
- pytorch_model-00030-of-00191.bin +3 -0
- pytorch_model-00031-of-00191.bin +3 -0
- pytorch_model-00032-of-00191.bin +3 -0
- pytorch_model-00033-of-00191.bin +3 -0
- pytorch_model-00034-of-00191.bin +3 -0
- pytorch_model-00035-of-00191.bin +3 -0
- pytorch_model-00036-of-00191.bin +3 -0
- pytorch_model-00037-of-00191.bin +3 -0
- pytorch_model-00038-of-00191.bin +3 -0
- pytorch_model-00039-of-00191.bin +3 -0
- pytorch_model-00040-of-00191.bin +3 -0
- pytorch_model-00041-of-00191.bin +3 -0
- pytorch_model-00042-of-00191.bin +3 -0
- pytorch_model-00043-of-00191.bin +3 -0
- pytorch_model-00044-of-00191.bin +3 -0
- pytorch_model-00045-of-00191.bin +3 -0
- pytorch_model-00046-of-00191.bin +3 -0
- pytorch_model-00047-of-00191.bin +3 -0
- pytorch_model-00048-of-00191.bin +3 -0
config.json
ADDED
@@ -0,0 +1,35 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/workspace/Meta-Llama-3.1-405B",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": 128001,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 16384,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 53248,
|
14 |
+
"max_position_embeddings": 131072,
|
15 |
+
"mlp_bias": false,
|
16 |
+
"model_type": "llama",
|
17 |
+
"num_attention_heads": 128,
|
18 |
+
"num_hidden_layers": 126,
|
19 |
+
"num_key_value_heads": 8,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": {
|
23 |
+
"factor": 8.0,
|
24 |
+
"high_freq_factor": 4.0,
|
25 |
+
"low_freq_factor": 1.0,
|
26 |
+
"original_max_position_embeddings": 8192,
|
27 |
+
"rope_type": "llama3"
|
28 |
+
},
|
29 |
+
"rope_theta": 500000.0,
|
30 |
+
"tie_word_embeddings": false,
|
31 |
+
"torch_dtype": "float16",
|
32 |
+
"transformers_version": "4.44.0",
|
33 |
+
"use_cache": false,
|
34 |
+
"vocab_size": 128256
|
35 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 128000,
|
4 |
+
"do_sample": true,
|
5 |
+
"eos_token_id": 128001,
|
6 |
+
"temperature": 0.6,
|
7 |
+
"top_p": 0.9,
|
8 |
+
"transformers_version": "4.44.0"
|
9 |
+
}
|
pytorch_model-00001-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2429626ccbaeab75582383d03dad1f22e56ea55a73fb6971549f673bd2094392
|
3 |
+
size 4806674800
|
pytorch_model-00002-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a229e1e2b9622eb78d46f7ba5a04e84eb0b610db9b42f02c7a943ca65da7063a
|
3 |
+
size 4026533863
|
pytorch_model-00003-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9771e5298f1f476767e2bf5244757ebc4b5fe314a3a167eab1bf96dc9095dd4
|
3 |
+
size 4630580764
|
pytorch_model-00004-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5305214634ddf0a8db2a4845807fb1bcd63e5e30fa98406125939b2bc4084e1f
|
3 |
+
size 4630580764
|
pytorch_model-00005-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff1162990b277e1900db7a0ca2c1b5ea185f222f97fbd6be11a08660410a9414
|
3 |
+
size 3489662678
|
pytorch_model-00006-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cad85ae654663d8a4056796ee98de112dcf2a8f42e40b81344897479a7a0265
|
3 |
+
size 4630580764
|
pytorch_model-00007-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1041636ab622aa3f7b61df9bc7e8f088c3af4368c5904abb286aa76faa667f3
|
3 |
+
size 4630580764
|
pytorch_model-00008-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c477537da2b3b23f1e2a6fc9638d2426db9ebe4dfd4d59d64ae152cac6cb07e6
|
3 |
+
size 3489662678
|
pytorch_model-00009-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d93e6e0ee97550b7bd537035220bb35c60a16b0ff809bf13aada30c65550911
|
3 |
+
size 4630580764
|
pytorch_model-00010-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24e12d46bf24605a8321ece0b3cfb7b72acc99a202411c2f275301372aaa5867
|
3 |
+
size 4630580764
|
pytorch_model-00011-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54826fc6370355e6459a219d03a57dd1cd647a98bcf10f2fe2903416c2031755
|
3 |
+
size 3489662678
|
pytorch_model-00012-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12603d8777448a0f9f0d500100039708f7b5fe059d5b0449906449e1d697578a
|
3 |
+
size 4630580764
|
pytorch_model-00013-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b121191fb720282727f8aaa9f9c55b853f94cd36b7d37618eeac6c0da5d017a
|
3 |
+
size 4630580764
|
pytorch_model-00014-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:294f78309ee6d47e8a439dea6f7f4cd491bf664c57e493b1a2bf1135d6adbbd8
|
3 |
+
size 3489662678
|
pytorch_model-00015-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41b66d02715eaa0e90a6199fd8e7ac86334b6dc1922f0c5c4edfdc4b05d9d787
|
3 |
+
size 4630580764
|
pytorch_model-00016-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d16d7af78042c1512b6def2b94744976806aff884977c32edd792e0a71cef50
|
3 |
+
size 4630580764
|
pytorch_model-00017-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:46393a02d9e4f7e66dbd609696ee898ce3e5a2ee2db897101abcddb60c5bafa6
|
3 |
+
size 3489662678
|
pytorch_model-00018-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d30a425d71aff4a46f322bf9d366221c4acca7d3f7bd795e475490895b034923
|
3 |
+
size 4630580764
|
pytorch_model-00019-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45e4e23a8de1bb99a129141610c2ff5aa2e8cf8702552dc4b4e6f10a90ea2345
|
3 |
+
size 4630580764
|
pytorch_model-00020-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0975d28e87f2f6df07d0db03f2d78b4d4065a2e61c9f65a7ada66b6253c8d69b
|
3 |
+
size 3489662678
|
pytorch_model-00021-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be943dc6e6f6f19bbad29c2ee7ed051f189a2ce7afbe783722122b6f8d710915
|
3 |
+
size 4630580764
|
pytorch_model-00022-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d0ca3da4215441b011afa47a53ace365f8627da30ce046d557cd3edb7738f1f1
|
3 |
+
size 4630580764
|
pytorch_model-00023-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70b41c12e524e0ca1a952958655727de27ac98e1c28024b406342cf3e145d733
|
3 |
+
size 3489662678
|
pytorch_model-00024-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:483790b936fd2db0bfeae162397eac6275daa80770ea346ec2790b50b3aa162f
|
3 |
+
size 4630580764
|
pytorch_model-00025-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2770892a357116d7715ba39cd15544f031bd707caf9650e2858e2981a57c214d
|
3 |
+
size 4630580764
|
pytorch_model-00026-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:313f8057731fc9903a0a8f18c25dac3f3eddd6eb0f5a240a4a7afcd59df114a4
|
3 |
+
size 3489662678
|
pytorch_model-00027-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b8eb5ed4fde96e9ac9797937b68358ab64087e608ac9a6e9d50ac14bf2a0b3a
|
3 |
+
size 4630580764
|
pytorch_model-00028-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e174fcb145156b66f68e7ce62a96171ec44759bc8e53a13da74686b90e1673a
|
3 |
+
size 4630580764
|
pytorch_model-00029-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d4327df4e985f6435e70d53ea0d1ff9a8edafab8bed7666a20deff6371b826e
|
3 |
+
size 3489662678
|
pytorch_model-00030-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f902910716c750fc82e6aed4750872e0d6aa824058775633f92e26781755c1be
|
3 |
+
size 4630580764
|
pytorch_model-00031-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a28c84c2937f6959956f9147de64440f8c3fb867740498ab13e2ec6b4dc85e54
|
3 |
+
size 4630580764
|
pytorch_model-00032-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1705bc5ecce4a344fbc4ede18cf8b9804a4cdcf3c7d5bf528fae9558fc41d1c0
|
3 |
+
size 3489662678
|
pytorch_model-00033-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f167ce425f2dc4b2c1fdfb7e453f5501d13bc41a3f6c1a0c54e4bc3896d565b4
|
3 |
+
size 4630580764
|
pytorch_model-00034-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7c2d1c9e0b802a9283caa87d008cc56a6fabb393dbc69abfa866a0493226c43
|
3 |
+
size 4630580764
|
pytorch_model-00035-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbea72ad8a3e8baf10739f75d21e2604eed058d7091b538260a5b671f65f5489
|
3 |
+
size 3489662678
|
pytorch_model-00036-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17c4b61c04a8c81226b7ae207ec035d5279cf8a97f41abc607a8997bdbf2933d
|
3 |
+
size 4630580764
|
pytorch_model-00037-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45bf39b64c41286c0b3118bcf6ca8540099680cf1f9b07101bf47dcab7cb93c7
|
3 |
+
size 4630580764
|
pytorch_model-00038-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e7eca3780521c6fabf9d47ef348038c00a1dab8588a90862fc731a54a056f5a
|
3 |
+
size 3489662678
|
pytorch_model-00039-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14b5d0e9a5b379a4cd98aba00287a15fde04ffecfb34250e451508f209f88a65
|
3 |
+
size 4630580764
|
pytorch_model-00040-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7fde76bd3a0f410d99e8b4bac49fdd590cf7592bef89f675d0a9a2ce433a5ae7
|
3 |
+
size 4630580764
|
pytorch_model-00041-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4e2b82bccaf8f7e828a02fe1fbace269204bd9500be9ebe36dc4f31a92ffd85
|
3 |
+
size 3489662678
|
pytorch_model-00042-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca7afbe0f6cf8a2a5dde67d54937ce9a00365c70d9fea8f0eb8f36a1be0b43c5
|
3 |
+
size 4630580764
|
pytorch_model-00043-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68d1c63ac606e9ee552653695227b29d19860bb75dd25ee7b0823b0567d00900
|
3 |
+
size 4630580764
|
pytorch_model-00044-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6a12287ec0e74581a8fefdeba265a965d9d14f8d04418470d594646bf7ef52e
|
3 |
+
size 3489662678
|
pytorch_model-00045-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8daefab2033db26ca5035b7a45abc3230d16ee20a3f840098288e5c0c40d2cef
|
3 |
+
size 4630580764
|
pytorch_model-00046-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2785f3ddba318b1e7ef1d540627e64fbf937d0fed2436a80205def3e48e0464c
|
3 |
+
size 4630580764
|
pytorch_model-00047-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2ba8e5f484eaf3d9af9e03e262c7168c15c7657ccb369eb96b6aeb27659e927
|
3 |
+
size 3489662678
|
pytorch_model-00048-of-00191.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ff190703f56304c72a6534d83bcbbc1924cae23474494b3db0b710d4b985823
|
3 |
+
size 4630580764
|