Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Appearance settings

Commit 9558ce7

Browse files
committed
feat: Update llama.cpp
1 parent a57d5df commit 9558ce7
Copy full SHA for 9558ce7

File tree

Expand file tree / Collapse file tree

1 file changed

+6
-2
lines changed
Filter options
Expand file tree / Collapse file tree

1 file changed

+6
-2
lines changed

‎llama_cpp/llama_cpp.py

Copy file name to clipboard | Expand all lines: llama_cpp/llama_cpp.py
+6 -2 | Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -256,12 +256,14 @@ def byref(obj: CtypesCData, offset: Optional[int] = None) -> CtypesRef[CtypesCDa
256256
# LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19, // except 1d tensors
257257
# LLAMA_FTYPE_MOSTLY_IQ2_XS = 20, // except 1d tensors
258258
# LLAMA_FTYPE_MOSTLY_Q2_K_S = 21, // except 1d tensors
259-
# LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22, // except 1d tensors
259+
# LLAMA_FTYPE_MOSTLY_IQ3_XS = 22, // except 1d tensors
260260
# LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23, // except 1d tensors
261261
# LLAMA_FTYPE_MOSTLY_IQ1_S = 24, // except 1d tensors
262262
# LLAMA_FTYPE_MOSTLY_IQ4_NL = 25, // except 1d tensors
263263
# LLAMA_FTYPE_MOSTLY_IQ3_S = 26, // except 1d tensors
264264
# LLAMA_FTYPE_MOSTLY_IQ3_M = 27, // except 1d tensors
265+
# LLAMA_FTYPE_MOSTLY_IQ2_S = 28, // except 1d tensors
266+
# LLAMA_FTYPE_MOSTLY_IQ2_M = 29, // except 1d tensors
265267

266268
# LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
267269
# };
@@ -285,12 +287,14 @@ def byref(obj: CtypesCData, offset: Optional[int] = None) -> CtypesRef[CtypesCDa
285287
LLAMA_FTYPE_MOSTLY_IQ2_XXS = 19
286288
LLAMA_FTYPE_MOSTLY_IQ2_XS = 20
287289
LLAMA_FTYPE_MOSTLY_Q2_K_S = 21
288-
LLAMA_FTYPE_MOSTLY_Q3_K_XS = 22
290+
LLAMA_FTYPE_MOSTLY_IQ3_XS = 22
289291
LLAMA_FTYPE_MOSTLY_IQ3_XXS = 23
290292
LLAMA_FTYPE_MOSTLY_IQ1_S = 24
291293
LLAMA_FTYPE_MOSTLY_IQ4_NL = 25
292294
LLAMA_FTYPE_MOSTLY_IQ3_S = 26
293295
LLAMA_FTYPE_MOSTLY_IQ3_M = 27
296+
LLAMA_FTYPE_MOSTLY_IQ2_S = 28
297+
LLAMA_FTYPE_MOSTLY_IQ2_M = 29
294298
LLAMA_FTYPE_GUESSED = 1024
295299

296300
# enum llama_rope_scaling_type {

0 commit comments

Comments
0 (0)
Morty Proxy: This is a proxified and sanitized view of the page; visit the original site.