David Huang committed on
Commit
39918fb
·
1 Parent(s): 1010849
Files changed (21) hide show
  1. .gitattributes +1 -0
  2. Q8_0-EXP-Q4_0/.gitattributes +17 -0
  3. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00001-of-00017.gguf +3 -0
  4. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00002-of-00017.gguf +3 -0
  5. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00003-of-00017.gguf +3 -0
  6. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00004-of-00017.gguf +3 -0
  7. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00005-of-00017.gguf +3 -0
  8. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00006-of-00017.gguf +3 -0
  9. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00007-of-00017.gguf +3 -0
  10. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00008-of-00017.gguf +3 -0
  11. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00009-of-00017.gguf +3 -0
  12. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00010-of-00017.gguf +3 -0
  13. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00011-of-00017.gguf +3 -0
  14. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00012-of-00017.gguf +3 -0
  15. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00013-of-00017.gguf +3 -0
  16. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00014-of-00017.gguf +3 -0
  17. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00015-of-00017.gguf +3 -0
  18. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00016-of-00017.gguf +3 -0
  19. Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00017-of-00017.gguf +3 -0
  20. README.md +5 -1
  21. mmproj-llama4-109b.gguf +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ mmproj-llama4-109b.gguf filter=lfs diff=lfs merge=lfs -text
Q8_0-EXP-Q4_0/.gitattributes ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00013-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
2
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00014-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
3
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00017-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
4
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00003-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
5
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00012-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
6
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00001-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
7
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00002-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
8
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00007-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
9
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00008-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
10
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00009-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
11
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00010-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
12
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00016-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
13
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00004-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
14
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00005-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
15
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00006-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
16
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00015-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
17
+ Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00011-of-00017.gguf filter=lfs diff=lfs merge=lfs -text
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00001-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abe5f385deceda3efb3ce0561722f13575e2bfa8ed74cd6c04a27333d06eb544
3
+ size 3989088224
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00002-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:add9d0846160017d9bc4ab09b8103c2f36097cfd2cef0f9dd475c99a73f0ad9a
3
+ size 3622627808
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00003-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb1ee2d1c538900bd72bde57ae940d095db9f008f4110e765b751099f319e8a8
3
+ size 3994544640
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00004-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ab90e4876d711565c529146a7f9d9c9e9b1418af01959cae82d2b54a3f906a7
3
+ size 3972262400
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00005-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8df253c01c578e88850b935415f9d0143929296b291ce3a59cf97eaff05fe4bf
3
+ size 3972262432
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00006-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e61a23b2964e08be7ea0c70aa16cf71d59cbed1c99a4ff351f727fc1023f809
3
+ size 3994524128
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00007-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ce9b0e0f4e6d4e0a42b9f6bb1b723b015fe91888a3537e6f534672d5dfddcdc
3
+ size 3955550752
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00008-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd5d87d6b5392831d33ae4c10145499bdb12e84518b08ca6d9293df5ca1ed66e
3
+ size 3622627872
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00009-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8355889448b4c3e25bf88b9ba4058c5b48412b5be0572c01ca0e61af7989b0c7
3
+ size 3955530208
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00010-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdac789d4c512761889dfeeb1937e515f7952fe5d9c0d42ad005047e75b02fb8
3
+ size 3999787552
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00011-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36b30f9b84d35492d3822e53300dbd028309d98dc1e048103159e7b4509ed30d
3
+ size 3622627872
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00012-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53dbda53bc9e4f288c6af8433aa0cd1efe1bb71a7889bd6965170abc9956a8fe
3
+ size 3955550752
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00013-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f76f2e5ee9864027fead03c3ccdbdede1f0521232af046ab15e3a5cbdfb0d528
3
+ size 3622627872
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00014-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb05e41320e149b1431e577797faf6452868d63e5587f00d53a7e219c3ff1996
3
+ size 3994544672
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00015-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fcb66fd4b34e27464cce8966f4ba2f33df34dada79b4747d631e87ca8db9305
3
+ size 3972262432
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00016-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9bea4eebf49e1bf448d49290970c3d75b8a62adec52cff1fe2950a200db616d
3
+ size 3972262432
Q8_0-EXP-Q4_0/Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0-00017-of-00017.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74db746ec244c2e03587e4440bb1f6ee555c8064232912e7be88b73972f837e3
3
+ size 3994524128
README.md CHANGED
@@ -2,4 +2,8 @@
2
  license: llama4
3
  base_model:
4
  - meta-llama/Llama-4-Scout-17B-16E-Instruct
5
- ---
 
 
 
 
 
2
  license: llama4
3
  base_model:
4
  - meta-llama/Llama-4-Scout-17B-16E-Instruct
5
+ ---
6
+
7
+ ```
8
+ llama-quantize --tensor-type ffn_down_exps=q4_0 --tensor-type ffn_gate_exps=q4_0 --tensor-type ffn_up_exps=q4_0 Llama-4-Scout-17B-16E-Instruct.gguf Llama-4-Scout-17B-16E-Instruct-GGUF-Q8_0-EXP-Q4_0.gguf q8_0
9
+ ```
mmproj-llama4-109b.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d73d72ef2b4c6b8022b7ef88df4f0dcd648258ff5951a10cd1c810219adfaafd
3
+ size 1746780768