apepkuss79 committed on
Commit
204a5b5
·
verified ·
1 Parent(s): ccbe474

Update models

Browse files
.gitattributes CHANGED
@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ DeepSeek-R1-Distill-Qwen-7B-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ DeepSeek-R1-Distill-Qwen-7B-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ DeepSeek-R1-Distill-Qwen-7B-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ DeepSeek-R1-Distill-Qwen-7B-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ DeepSeek-R1-Distill-Qwen-7B-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ DeepSeek-R1-Distill-Qwen-7B-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ DeepSeek-R1-Distill-Qwen-7B-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ DeepSeek-R1-Distill-Qwen-7B-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ DeepSeek-R1-Distill-Qwen-7B-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ DeepSeek-R1-Distill-Qwen-7B-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ DeepSeek-R1-Distill-Qwen-7B-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ DeepSeek-R1-Distill-Qwen-7B-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
48
+ DeepSeek-R1-Distill-Qwen-7B-f16.gguf filter=lfs diff=lfs merge=lfs -text
DeepSeek-R1-Distill-Qwen-7B-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:def5f628be356d6d4c92913c4ab227d34972e79398e4c304988d28f4e70213af
3
+ size 3015939776
DeepSeek-R1-Distill-Qwen-7B-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cc64f6812c551f85ba7a0a0de222337223df4d424b377ae4f2297209d860a34
3
+ size 4088458944
DeepSeek-R1-Distill-Qwen-7B-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cd1331f4087879c4bc2a0443526ea8a97d807abe1654328f68629ff426c9bae
3
+ size 3808390848
DeepSeek-R1-Distill-Qwen-7B-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54cda95194bfcaef6176e508fc0c1a92af368bf6d30049da2f65634f6c372b2b
3
+ size 3492368064
DeepSeek-R1-Distill-Qwen-7B-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50f1ec848ae1c65578105d1ef880a291390edc0c6d07c7ec1734a9f753d65ad9
3
+ size 4431390400
DeepSeek-R1-Distill-Qwen-7B-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eda5f18e3b32782f053c4baefa363a96b390cbab6f9fe643d9cec478898b36a
3
+ size 4683073216
DeepSeek-R1-Distill-Qwen-7B-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c251f553b060c206c9b0bde01253c08bdb78e84b5b213f7d1dac41f2a927ef5
3
+ size 4457768640
DeepSeek-R1-Distill-Qwen-7B-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11585d590f930de302009d65675c8a30ce0f27be6f1878a78ffa1b5429ef8228
3
+ size 5315176128
DeepSeek-R1-Distill-Qwen-7B-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0366f3aed111846266153192edcd90dfcd39ae374f6d07fa243c8acc46041f16
3
+ size 5444830912
DeepSeek-R1-Distill-Qwen-7B-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3f7a9efcc79055542c51418960aa3fdaf4ca11dd17ea2ba2fafdbae724f062
3
+ size 5315176128
DeepSeek-R1-Distill-Qwen-7B-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1f9c8008ed93e268f9f635e51726e6ce58ff4f861724903b1fb61ff25aab1ab
3
+ size 6254198464
DeepSeek-R1-Distill-Qwen-7B-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf965fadac9d87c26a2d102ec90c45439c0c8a8c0c1f23f2e72c461014df8b9c
3
+ size 8098524864
DeepSeek-R1-Distill-Qwen-7B-f16.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3800f07f3ca5a96897aaf46892105cb03bc9f8a29b1cdf20122beb0cd018815
3
+ size 15237852864
config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "Qwen2ForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token_id": 151643,
7
+ "eos_token_id": 151643,
8
+ "hidden_act": "silu",
9
+ "hidden_size": 3584,
10
+ "initializer_range": 0.02,
11
+ "intermediate_size": 18944,
12
+ "max_position_embeddings": 131072,
13
+ "max_window_layers": 28,
14
+ "model_type": "qwen2",
15
+ "num_attention_heads": 28,
16
+ "num_hidden_layers": 28,
17
+ "num_key_value_heads": 4,
18
+ "rms_norm_eps": 1e-06,
19
+ "rope_theta": 10000,
20
+ "sliding_window": 4096,
21
+ "tie_word_embeddings": false,
22
+ "torch_dtype": "bfloat16",
23
+ "transformers_version": "4.44.0",
24
+ "use_cache": true,
25
+ "use_mrope": false,
26
+ "use_sliding_window": false,
27
+ "vocab_size": 152064
28
+ }