altomek committed on
Commit
0fd3066
1 Parent(s): 4e78cd6

quants upload

Browse files

Llama-3.1-Minitron-4B-Width-Base Q4_0_4_4 quant

.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Llama-3.1-Minitron-4B-Width-Base-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text
Llama-3.1-Minitron-4B-Width-Base-Q4_0_4_4.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6acecb42163a5ead82ca9494c86e494ed902cfdefe4b0a8b61fce85e7e643782
3
+ size 2648521376
README.md ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model: nvidia/Llama-3.1-Minitron-4B-Width-Base
3
+ license: other
4
+ license_name: nvidia-open-model-license
5
+ license_link: >-
6
+ https://developer.download.nvidia.com/licenses/nvidia-open-model-license-agreement-june-2024.pdf
7
+ inference: false
8
+ ---
9
+
10
+ # Llama-3.1-Minitron-4B-Width-Base
11
+
12
+ GGUF Q4_0_4_4 quant of https://huggingface.co/nvidia/Llama-3.1-Minitron-4B-Width-Base