Upload folder using huggingface_hub
Browse files. This view is limited to 50 files because it contains too many changes. See raw diff.
- .gitattributes +104 -0
- README.md +47 -0
- featherless-quants.png +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00001-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00002-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00003-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00004-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00005-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00006-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00007-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00008-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00001-of-00006.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00002-of-00006.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00003-of-00006.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00004-of-00006.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00005-of-00006.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00006-of-00006.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00001-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00002-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00003-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00004-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00005-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00006-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00007-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00008-of-00008.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00001-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00002-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00003-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00004-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00005-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00006-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00007-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00001-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00002-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00003-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00004-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00005-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00006-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00007-of-00007.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00001-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00002-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00003-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00004-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00005-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00006-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00007-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00008-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00009-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00001-of-00009.gguf +3 -0
- nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00002-of-00009.gguf +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,107 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
featherless-quants.png filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00001-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00002-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00003-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00004-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00005-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00006-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00007-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00008-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00001-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00002-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00003-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00004-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
|
| 49 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00005-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
|
| 50 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00006-of-00006.gguf filter=lfs diff=lfs merge=lfs -text
|
| 51 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00001-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00002-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00003-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00004-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00005-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00006-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00007-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00008-of-00008.gguf filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00001-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00002-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00003-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00004-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 63 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00005-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 64 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00006-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 65 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00007-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 66 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00001-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 67 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00002-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 68 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00003-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 69 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00004-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 70 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00005-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 71 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00006-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 72 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00007-of-00007.gguf filter=lfs diff=lfs merge=lfs -text
|
| 73 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00001-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 74 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00002-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 75 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00003-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 76 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00004-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 77 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00005-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 78 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00006-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 79 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00007-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 80 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00008-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 81 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00009-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 82 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00001-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 83 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00002-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 84 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00003-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 85 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00004-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 86 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00005-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 87 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00006-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 88 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00007-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 89 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00008-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 90 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00009-of-00009.gguf filter=lfs diff=lfs merge=lfs -text
|
| 91 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00001-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 92 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00002-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 93 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00003-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 94 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00004-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 95 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00005-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 96 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00006-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 97 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00007-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 98 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00008-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 99 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00009-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 100 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00010-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 101 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M-00011-of-00011.gguf filter=lfs diff=lfs merge=lfs -text
|
| 102 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00001-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 103 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00002-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 104 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00003-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 105 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00004-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 106 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00005-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 107 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00006-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 108 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00007-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 109 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00008-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 110 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00009-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 111 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S-00010-of-00010.gguf filter=lfs diff=lfs merge=lfs -text
|
| 112 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00001-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 113 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00002-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 114 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00003-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 115 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00004-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 116 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00005-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 117 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00006-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 118 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00007-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 119 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00008-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 120 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00009-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 121 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00010-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 122 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00011-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 123 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q6_K/nvidia-Llama3-ChatQA-1.5-70B-Q6_K-00012-of-00012.gguf filter=lfs diff=lfs merge=lfs -text
|
| 124 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00001-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 125 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00002-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 126 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00003-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 127 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00004-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 128 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00005-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 129 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00006-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 130 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00007-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 131 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00008-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 132 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00009-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 133 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00010-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 134 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00011-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 135 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00012-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 136 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00013-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 137 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00014-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 138 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00015-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
| 139 |
+
nvidia-Llama3-ChatQA-1.5-70B-Q8_0/nvidia-Llama3-ChatQA-1.5-70B-Q8_0-00016-of-00016.gguf filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
|
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
base_model: nvidia/Llama3-ChatQA-1.5-70B
|
| 3 |
+
pipeline_tag: text-generation
|
| 4 |
+
quantized_by: featherless-ai-quants
|
| 5 |
+
---
|
| 6 |
+
|
| 7 |
+
# nvidia/Llama3-ChatQA-1.5-70B GGUF Quantizations 🚀
|
| 8 |
+
|
| 9 |
+

|
| 10 |
+
|
| 11 |
+
*Optimized GGUF quantization files for enhanced model performance*
|
| 12 |
+
|
| 13 |
+
> Powered by [Featherless AI](https://featherless.ai) - run any model you'd like for a simple, small fee.
|
| 14 |
+
---
|
| 15 |
+
|
| 16 |
+
## Available Quantizations 📊
|
| 17 |
+
|
| 18 |
+
| Quantization Type | File | Size |
|
| 19 |
+
|-------------------|------|------|
|
| 20 |
+
| IQ4_XS | [nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS) | 36496.80 MB (folder) |
|
| 21 |
+
| Q2_K | [nvidia-Llama3-ChatQA-1.5-70B-Q2_K](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q2_K) | 25153.26 MB (folder) |
|
| 22 |
+
| Q3_K_L | [nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L) | 35420.03 MB (folder) |
|
| 23 |
+
| Q3_K_M | [nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M) | 32680.03 MB (folder) |
|
| 24 |
+
| Q3_K_S | [nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S) | 29480.03 MB (folder) |
|
| 25 |
+
| Q4_K_M | [nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M) | 40550.61 MB (folder) |
|
| 26 |
+
| Q4_K_S | [nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S) | 38478.11 MB (folder) |
|
| 27 |
+
| Q5_K_M | [nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_M) | 47635.86 MB (folder) |
|
| 28 |
+
| Q5_K_S | [nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q5_K_S) | 46403.36 MB (folder) |
|
| 29 |
+
| Q6_K | [nvidia-Llama3-ChatQA-1.5-70B-Q6_K](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q6_K) | 55206.44 MB (folder) |
|
| 30 |
+
| Q8_0 | [nvidia-Llama3-ChatQA-1.5-70B-Q8_0](https://huggingface.co/featherless-ai-quants/nvidia-Llama3-ChatQA-1.5-70B-GGUF/tree/main/nvidia-Llama3-ChatQA-1.5-70B-Q8_0) | 71501.78 MB (folder) |
|
| 31 |
+
|
| 32 |
+
|
| 33 |
+
---
|
| 34 |
+
|
| 35 |
+
## ⚡ Powered by [Featherless AI](https://featherless.ai)
|
| 36 |
+
|
| 37 |
+
### Key Features
|
| 38 |
+
|
| 39 |
+
- 🔥 **Instant Hosting** - Deploy any Llama model on Hugging Face instantly
|
| 40 |
+
- 🛠️ **Zero Infrastructure** - No server setup or maintenance required
|
| 41 |
+
- 📚 **Vast Compatibility** - Support for 2400+ models and counting
|
| 42 |
+
- 💎 **Affordable Pricing** - Starting at just $10/month
|
| 43 |
+
|
| 44 |
+
---
|
| 45 |
+
|
| 46 |
+
**Links:**
|
| 47 |
+
[Get Started](https://featherless.ai) | [Documentation](https://featherless.ai/docs) | [Models](https://featherless.ai/models)
|
featherless-quants.png
ADDED
|
Git LFS Details
|
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00001-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a2f64ddf6dd775a0a29e9de6c52f927016b8aa8dab2981b1c1e72b781667f5f0
|
| 3 |
+
size 5004223488
|
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00002-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1fe506900306a015a1d741765b5322779570d53ded0241d418392733ab3a0699
|
| 3 |
+
size 4970386976
|
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00003-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:efaab75c0841fa71fbea6cd3da51ca58e82bf6da4ec1333732274fd251044037
|
| 3 |
+
size 4886009568
|
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00004-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ffb030ce81e7c1cc6ceebb5b0c2c251a1784e51f8bb86c1a20a8b2615d3a32f2
|
| 3 |
+
size 4890498912
|
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00005-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a4d0d88ab9f055f9aaaad653940316de62f56944c9aecc2ce3e0359afb62e200
|
| 3 |
+
size 4890498912
|
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00006-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96965f81952f7079e6fa20456d54b78bb2932571791a61196f6fe09ed500ec0d
|
| 3 |
+
size 4973827808
|
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00007-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcf08867de0344f427e0d1cbd959cdf29852d4728b846faa0d17e38a9457481f
|
| 3 |
+
size 4931917792
|
nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS/nvidia-Llama3-ChatQA-1.5-70B-IQ4_XS-00008-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f1817f8e8d069d707a3555bc47c51a7e20c9e4ed8216379c6c44acc41b779b1
|
| 3 |
+
size 3722300864
|
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00001-of-00006.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bbebb4a39f765f38a2daed698e45ddc386c235a16eeb6d2134fee06e8cb5344e
|
| 3 |
+
size 4933709440
|
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00002-of-00006.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d711264f32b5a0aa628198b1f8c91cf67f828d6fc87c8b251ec4757116d5aa99
|
| 3 |
+
size 4955054560
|
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00003-of-00006.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca7ee50b4974db4405e314794c0d19b54fff7a3fd741f3bff21f370855873c1e
|
| 3 |
+
size 4931199456
|
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00004-of-00006.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6827adf0ccbafa123c8f320e500195a6f88d0abd4a80003de35b10616edc21d
|
| 3 |
+
size 4975468832
|
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00005-of-00006.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:016a46b4174f0a5e68a967c7e054da37dfdaf12e34997036d62aaa9b3792bed3
|
| 3 |
+
size 4952269152
|
nvidia-Llama3-ChatQA-1.5-70B-Q2_K/nvidia-Llama3-ChatQA-1.5-70B-Q2_K-00006-of-00006.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8424fdea3608b53cbf4ef990ff160192df43eed490fb08d9e7e68df40826e69
|
| 3 |
+
size 1627408000
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00001-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d39ad1fea86a35de1c1ee959929596097093157e301b22f1e8448803811de16a
|
| 3 |
+
size 4986512992
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00002-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ede26fb10801bb4aa968d11da4b53f7cad99309fcf98986e08c50f866c01991
|
| 3 |
+
size 4976318240
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00003-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f71d01b54f35cf4136c6123769c20c8d92cde9a0079d590ca02609e0e1b19d0
|
| 3 |
+
size 4985722784
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00004-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8cfaa18b8dde7bdd5b4a4a94d8aad06553db1be546cbd3816bbc7887610488a2
|
| 3 |
+
size 4925167520
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00005-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:70c0868b6565211eef91222d032addcbd905c7d5d1f7b61b95309835c41246b8
|
| 3 |
+
size 4925167520
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00006-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b2ae2c6a10d762b4700191decd774c261b6eb8cc023c377e2bdc9f5f4db7fe8b
|
| 3 |
+
size 4925167520
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00007-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:969f89e19651c4f74995c0a9212edcdb46a9ce1b68af54ad38bedb87a06c68d2
|
| 3 |
+
size 4925167520
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_L-00008-of-00008.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8adc0ab10ddd3369f0f8f9e5563a0abe37510c030821b9b2d30e312f9e080b62
|
| 3 |
+
size 2491369696
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00001-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1dcc8c83804ec90e14cd847c8e7b32cef5dc304d360729b4966b6c63c602a5e1
|
| 3 |
+
size 4914161408
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00002-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e61900b1b6c7fa05163b762ea15640f6373dcd210cec751a1db08532644edc02
|
| 3 |
+
size 4944861376
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00003-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d9da8a468f4204448737e9c00b8506652b997fe459066fc1ae9cc2a15df95dc
|
| 3 |
+
size 4919925184
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00004-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6f6add205dd0216026565967eb719d0f956eff2c34eee76baad590200b06c13
|
| 3 |
+
size 4919925184
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00005-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4915ca59ac91f4d00a77c22e5fd430563f631d3945b037dd567c3d549c3a5f63
|
| 3 |
+
size 4919925184
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00006-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31f7959cc24efb3237b313060f6ab7f5ebed4dd435bea42a29caa570812a95e1
|
| 3 |
+
size 4919925184
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_M-00007-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35e1375a9b9f13d3aeb45bb2a4c92c4d117ac2ab635fc2a9190aa08fb608084a
|
| 3 |
+
size 4728771904
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00001-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:373ae41dd6651f7e4f602fc2aeeb524c0f234c55d269c673699f81766b471980
|
| 3 |
+
size 4998867488
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00002-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5fd968f96b139c5b7fbb781e35da97504332ac60ac403be1d2a0b02a2f9eafd4
|
| 3 |
+
size 4909440000
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00003-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cfabfea38ffb7358b5b26561ce8ef989391fb87b59b4a610ba16980b8fd74088
|
| 3 |
+
size 4976549216
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00004-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4704dd531d42f52416de7d934b0fc27718c0b74aae8d5b6cd165ac695cfdd78c
|
| 3 |
+
size 4909440000
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00005-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:150f1b8c80e3b949d02ee05fb6ef27c094949fb8fbef1334c3a99260acc8e882
|
| 3 |
+
size 4909440000
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00006-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a8e44eed70e4943d89b8ad1689ffb264578fabd74931835b3a82d94ffd36bae
|
| 3 |
+
size 4980186592
|
nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q3_K_S-00007-of-00007.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a9b42017df8cf27d75f957ff8e9f294264d893cbcc9e114b85da5e08f422717
|
| 3 |
+
size 1228128864
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00001-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b9d48efbb1a702a5f723e81913288d6eae48d144f552d2a2030c51d2a1ee563
|
| 3 |
+
size 4993999424
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00002-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89150ca5091b777ce2d0e1ffdc2a601c47f23e51116255cd9fb36f92c884189d
|
| 3 |
+
size 4984738816
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00003-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d13a188e00489d373e220dd660bc4ca19358c816e090b4a42439752aa73fff7e
|
| 3 |
+
size 4982183360
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00004-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea995e551ef362f32e4c2999cb2d39288bca5a22b6670ca16b2675a8f51f9a54
|
| 3 |
+
size 4923102304
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00005-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df72464bda183d18c5f5b9e5f18b0d85605c1523542dde68e175bb213ed2b5aa
|
| 3 |
+
size 4876997952
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00006-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e4bc37fbac77e2ab0ffc74f55f082e785674870712c1de9d75bf2e12f84800f
|
| 3 |
+
size 4876997952
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00007-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e4bc36d67a1d6f2f4b0652a2598ec3b3eba284e6963c30ce47aa694c953edbc
|
| 3 |
+
size 4988376192
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00008-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:849b33a04842a2b78ced2a11acf4c852a4dbafe827ae5f20d188ed7b824cbae5
|
| 3 |
+
size 4855796832
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_M-00009-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:de163661b41829992dd6248a73a3116af4cf854ecbceee94df54443a30c6ade6
|
| 3 |
+
size 3038202144
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00001-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee1d2935780fd92e939b4d9d5434a750e0e3460089e99c876056d52ed4b9da0e
|
| 3 |
+
size 4940555040
|
nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S/nvidia-Llama3-ChatQA-1.5-70B-Q4_K_S-00002-of-00009.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b31c42e5e2302f6e05a911843d4c72c47da17034c3bf3e2c3bef724e41b7beb
|
| 3 |
+
size 4899542080
|