David Huang
committed on
Commit
·
39918fb
1
Parent(s):
1010849
update
Browse files
- .gitattributes +1 -0
- Q8_0-EXP-Q4_0/.gitattributes +17 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00001-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00002-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00003-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00004-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00005-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00006-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00007-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00008-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00009-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00010-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00011-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00012-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00013-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00014-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00015-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00016-of-00017.gguf +3 -0
- Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00017-of-00017.gguf +3 -0
- README.md +5 -1
- mmproj-llama4-109b.gguf +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
mmproj-llama4-109b.gguf filter=lfs diff=lfs merge=lfs -text
|
Q8_0-EXP-Q4_0/.gitattributes
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00013-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
2 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00014-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
3 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00017-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
4 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00003-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
5 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00012-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
6 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00001-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
7 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00002-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
8 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00007-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
9 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00008-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
10 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00009-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
11 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00010-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
12 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00016-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
13 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00004-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
14 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00005-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
15 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00006-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
16 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00015-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
17 |
+
Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00011-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00001-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:abe5f385deceda3efb3ce0561722f13575e2bfa8ed74cd6c04a27333d06eb544
|
3 |
+
size 3989088224
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00002-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:add9d0846160017d9bc4ab09b8103c2f36097cfd2cef0f9dd475c99a73f0ad9a
|
3 |
+
size 3622627808
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00003-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb1ee2d1c538900bd72bde57ae940d095db9f008f4110e765b751099f319e8a8
|
3 |
+
size 3994544640
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00004-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ab90e4876d711565c529146a7f9d9c9e9b1418af01959cae82d2b54a3f906a7
|
3 |
+
size 3972262400
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00005-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8df253c01c578e88850b935415f9d0143929296b291ce3a59cf97eaff05fe4bf
|
3 |
+
size 3972262432
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00006-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e61a23b2964e08be7ea0c70aa16cf71d59cbed1c99a4ff351f727fc1023f809
|
3 |
+
size 3994524128
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00007-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ce9b0e0f4e6d4e0a42b9f6bb1b723b015fe91888a3537e6f534672d5dfddcdc
|
3 |
+
size 3955550752
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00008-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd5d87d6b5392831d33ae4c10145499bdb12e84518b08ca6d9293df5ca1ed66e
|
3 |
+
size 3622627872
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00009-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8355889448b4c3e25bf88b9ba4058c5b48412b5be0572c01ca0e61af7989b0c7
|
3 |
+
size 3955530208
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00010-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdac789d4c512761889dfeeb1937e515f7952fe5d9c0d42ad005047e75b02fb8
|
3 |
+
size 3999787552
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00011-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36b30f9b84d35492d3822e53300dbd028309d98dc1e048103159e7b4509ed30d
|
3 |
+
size 3622627872
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00012-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53dbda53bc9e4f288c6af8433aa0cd1efe1bb71a7889bd6965170abc9956a8fe
|
3 |
+
size 3955550752
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00013-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f76f2e5ee9864027fead03c3ccdbdede1f0521232af046ab15e3a5cbdfb0d528
|
3 |
+
size 3622627872
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00014-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb05e41320e149b1431e577797faf6452868d63e5587f00d53a7e219c3ff1996
|
3 |
+
size 3994544672
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00015-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fcb66fd4b34e27464cce8966f4ba2f33df34dada79b4747d631e87ca8db9305
|
3 |
+
size 3972262432
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00016-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9bea4eebf49e1bf448d49290970c3d75b8a62adec52cff1fe2950a200db616d
|
3 |
+
size 3972262432
|
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00017-of-00017.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74db746ec244c2e03587e4440bb1f6ee555c8064232912e7be88b73972f837e3
|
3 |
+
size 3994524128
|
README.md
CHANGED
@@ -2,4 +2,8 @@
|
|
2 |
license: llama4
|
3 |
base_model:
|
4 |
- meta-llama/Llama-4-Scout-17B-16E-Instruct
|
5 |
-
---
|
|
|
|
|
|
|
|
|
|
2 |
license: llama4
|
3 |
base_model:
|
4 |
- meta-llama/Llama-4-Scout-17B-16E-Instruct
|
5 |
+
---
|
6 |
+
|
7 |
+
```
|
8 |
+
llama-quantize --tensor-type ffn_down_exps=q4_0 --tensor-type ffn_gate_exps=q4_0 --tensor-type ffn_up_exps=q4_0 Llama-4-Scout-17B-16E-Instruct.gguf Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0.gguf q8_0
|
9 |
+
```
|
mmproj-llama4-109b.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d73d72ef2b4c6b8022b7ef88df4f0dcd648258ff5951a10cd1c810219adfaafd
|
3 |
+
size 1746780768
|