quants upload
Browse files — Llama-3.1-Minitron-4B-Width-Base Q4_0_4_4 quant
- .gitattributes +1 -0
- Llama-3.1-Minitron-4B-Width-Base-Q4_0_4_4.gguf +3 -0
- README.md +12 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
Llama-3.1-Minitron-4B-Width-Base-Q4_0_4_4.gguf filter=lfs diff=lfs merge=lfs -text
|
Llama-3.1-Minitron-4B-Width-Base-Q4_0_4_4.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6acecb42163a5ead82ca9494c86e494ed902cfdefe4b0a8b61fce85e7e643782
|
3 |
+
size 2648521376
|
README.md
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model: nvidia/Llama-3.1-Minitron-4B-Width-Base
|
3 |
+
license: other
|
4 |
+
license_name: nvidia-open-model-license
|
5 |
+
license_link: >-
|
6 |
+
https://developer.download.nvidia.com/licenses/nvidia-open-model-license-agreement-june-2024.pdf
|
7 |
+
inference: false
|
8 |
+
---
|
9 |
+
|
10 |
+
# Llama-3.1-Minitron-4B-Width-Base
|
11 |
+
|
12 |
+
GGUF Q4_0_4_4 quant of https://huggingface.co/nvidia/Llama-3.1-Minitron-4B-Width-Base
|