Llamacpp quants
Browse files- README.md +4 -2
- gemma-2-9b-it-IQ2_M.gguf +2 -2
- gemma-2-9b-it-IQ2_S.gguf +2 -2
- gemma-2-9b-it-IQ2_XS.gguf +2 -2
- gemma-2-9b-it-IQ3_M.gguf +2 -2
- gemma-2-9b-it-IQ3_XS.gguf +2 -2
- gemma-2-9b-it-IQ3_XXS.gguf +2 -2
- gemma-2-9b-it-IQ4_XS.gguf +2 -2
- gemma-2-9b-it-Q2_K.gguf +2 -2
- gemma-2-9b-it-Q2_K_L.gguf +2 -2
- gemma-2-9b-it-Q3_K_L.gguf +2 -2
- gemma-2-9b-it-Q3_K_M.gguf +2 -2
- gemma-2-9b-it-Q3_K_S.gguf +2 -2
- gemma-2-9b-it-Q3_K_XL.gguf +2 -2
- gemma-2-9b-it-Q4_K_L.gguf +2 -2
- gemma-2-9b-it-Q4_K_M.gguf +2 -2
- gemma-2-9b-it-Q4_K_S.gguf +2 -2
- gemma-2-9b-it-Q5_K_L.gguf +2 -2
- gemma-2-9b-it-Q5_K_M.gguf +2 -2
- gemma-2-9b-it-Q5_K_S.gguf +2 -2
- gemma-2-9b-it-Q6_K.gguf +2 -2
- gemma-2-9b-it-Q6_K_L.gguf +2 -2
- gemma-2-9b-it-Q8_0.gguf +2 -2
- gemma-2-9b-it-Q8_0_L.gguf +2 -2
- gemma-2-9b-it-f32.gguf +2 -2
- gemma-2-9b-it.imatrix +1 -1
README.md
CHANGED
@@ -16,7 +16,7 @@ base_model: google/gemma-2-9b-it
|
|
16 |
|
17 |
## Llamacpp imatrix Quantizations of gemma-2-9b-it
|
18 |
|
19 |
-
Using <a href="https://github.com/ggerganov/llama.cpp/">llama.cpp</a> release <a href="https://github.com/ggerganov/llama.cpp/releases/tag/
|
20 |
|
21 |
Original model: https://huggingface.co/google/gemma-2-9b-it
|
22 |
|
@@ -25,9 +25,11 @@ All quants made using imatrix option with dataset from [here](https://gist.githu
|
|
25 |
## Prompt format
|
26 |
|
27 |
```
|
28 |
-
<start_of_turn>user
|
29 |
{prompt}<end_of_turn>
|
30 |
<start_of_turn>model
|
|
|
|
|
31 |
|
32 |
```
|
33 |
|
|
|
16 |
|
17 |
## Llamacpp imatrix Quantizations of gemma-2-9b-it
|
18 |
|
19 |
+
Using <a href="https://github.com/ggerganov/llama.cpp/">llama.cpp</a> release <a href="https://github.com/ggerganov/llama.cpp/releases/tag/b3266">b3266</a> for quantization.
|
20 |
|
21 |
Original model: https://huggingface.co/google/gemma-2-9b-it
|
22 |
|
|
|
25 |
## Prompt format
|
26 |
|
27 |
```
|
28 |
+
<bos><start_of_turn>user
|
29 |
{prompt}<end_of_turn>
|
30 |
<start_of_turn>model
|
31 |
+
<end_of_turn>
|
32 |
+
<start_of_turn>model
|
33 |
|
34 |
```
|
35 |
|
gemma-2-9b-it-IQ2_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22f1598b84ff74b057ebbc772ff921b74d8ec2bfc04a46b0e012ba3a55ac88d5
|
3 |
+
size 3434669920
|
gemma-2-9b-it-IQ2_S.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aee7ef22832856ad1767627530028b325d85c6b0818e5ae8bcdcd7c9099d4085
|
3 |
+
size 3211487072
|
gemma-2-9b-it-IQ2_XS.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1b7b3b9418dca6c7320c996fd309ff19b645b254cfd01d56dad45c3eda1191d
|
3 |
+
size 3067381600
|
gemma-2-9b-it-IQ3_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:264554168b51b3dbb416a994d4f4de761206e246f062dee7c5bfb75748eebcc5
|
3 |
+
size 4494616416
|
gemma-2-9b-it-IQ3_XS.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40e8cd37cf20ef4439b8ca807f7d9a694baeabe544855fc36c3cb2a929c867f6
|
3 |
+
size 4144990048
|
gemma-2-9b-it-IQ3_XXS.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57ae50cd71783cae22d80c1eed4578a12c0a33656b8a72454eb0aa7bac517d2c
|
3 |
+
size 3796739936
|
gemma-2-9b-it-IQ4_XS.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:717d862253259f2b9f8bae6dacfe2de4e548e07b681636abaccc5857cc64c539
|
3 |
+
size 5183031136
|
gemma-2-9b-it-Q2_K.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bbc9bbfc3177d7c755469f513a26957a65daf267f50eea6b9ecf0aaa01e9824
|
3 |
+
size 3805398880
|
gemma-2-9b-it-Q2_K_L.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b449f7ab8849467305367a6b7954f1a7e38b1985d654c31074e5bf8138eb8978
|
3 |
+
size 4887766880
|
gemma-2-9b-it-Q3_K_L.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdecc51155ec3257ad944b906fbdb6db956270796f8770a696fb4dd5360236c7
|
3 |
+
size 5132453728
|
gemma-2-9b-it-Q3_K_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9336a60687e668641ce713f04bc294393ad67f73eb67cd26d62d2d33c1fbb4e1
|
3 |
+
size 4761782112
|
gemma-2-9b-it-Q3_K_S.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc1dbe1bb26875cc2e2e5198c366dd87d1656475c0fe081da99af1d1fbb5ada3
|
3 |
+
size 4337665888
|
gemma-2-9b-it-Q3_K_XL.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e89d15d86b6417353f2deefeafc9bc060f61d6a482c715f991e1be99d60f4148
|
3 |
+
size 6214821728
|
gemma-2-9b-it-Q4_K_L.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8bb3ad73320d4814c1935766f0b9eaf47de1f8672c6688080db2bfa400eab1ad
|
3 |
+
size 6843426656
|
gemma-2-9b-it-Q4_K_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c70fd20caec79fb953b83031c46ddea4e99905835a66af7b8a856aa1b2534614
|
3 |
+
size 5761058656
|
gemma-2-9b-it-Q4_K_S.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c801ce6f8486ff5b6cdf958f2ecc75d0ba5a50626ac14d80a79d1434ef2e2ca
|
3 |
+
size 5478926176
|
gemma-2-9b-it-Q5_K_L.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73ab83d6cc9e754af2c80bcf6009928c47d17813e7aa915d21062c4debfe8346
|
3 |
+
size 7729735520
|
gemma-2-9b-it-Q5_K_M.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f78d0bd3513fedd4ba55adb4e97ca744b37f46d42aca11d97dd57dd506a2fd50
|
3 |
+
size 6647367520
|
gemma-2-9b-it-Q5_K_S.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77eb98f95812f1af5fa004cc4d6a1e5e1a63668ec2d8b71af59ab2df97b0ba28
|
3 |
+
size 6483593056
|
gemma-2-9b-it-Q6_K.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac4ff889a8e5fb8a8844484a0a5d489a6352bf267c6f1e9e0e182ba5bc1970d7
|
3 |
+
size 7589070688
|
gemma-2-9b-it-Q6_K_L.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:864a9cade300574911946220d7db5fd1c37ab71101bbb4beedb6611a9cf23d61
|
3 |
+
size 8671438688
|
gemma-2-9b-it-Q8_0.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d5ff18d06640d4f523cfcc2c699ac27165b0ce319d9894e7cd9771f77460c47
|
3 |
+
size 9827149664
|
gemma-2-9b-it-Q8_0_L.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62ac7f5be275544048dbbde28db798864c1371fbdba24cc83ebb4f4c45ca21d9
|
3 |
+
size 10687309664
|
gemma-2-9b-it-f32.gguf
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeab5ced5dd791e63b1bcee5823af35ce2fae0ca6438f0d788d4dd09b9d1fdc6
|
3 |
+
size 36972881504
|
gemma-2-9b-it.imatrix
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6116901
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e535b9f7be1305a997e288316242e42ccac1cf9810057c96bd6a194b3cc7495
|
3 |
size 6116901
|