File tree Expand file tree Collapse file tree 2 files changed +8
-0
lines changed
Filter options
Expand file tree Collapse file tree 2 files changed +8
-0
lines changed
Original file line number Diff line number Diff line change @@ -227,6 +227,7 @@ def __init__(
227
227
rope_freq_scale : float = 1.0 ,
228
228
n_gqa : Optional [int ] = None , # (TEMPORARY) must be 8 for llama2 70b
229
229
rms_norm_eps : Optional [float ] = None , # (TEMPORARY)
230
+ mul_mat_q : Optional [bool ] = None , # (TEMPORARY)
230
231
verbose : bool = True ,
231
232
):
232
233
"""Load a llama.cpp model from `model_path`.
@@ -293,6 +294,9 @@ def __init__(
293
294
if rms_norm_eps is not None :
294
295
self .params .rms_norm_eps = rms_norm_eps
295
296
297
+ if mul_mat_q is not None :
298
+ self .params .mul_mat_q = mul_mat_q
299
+
296
300
self .last_n_tokens_size = last_n_tokens_size
297
301
self .n_batch = min (n_ctx , n_batch )
298
302
Original file line number Diff line number Diff line change @@ -103,6 +103,10 @@ class Settings(BaseSettings):
103
103
default = None ,
104
104
description = "TEMPORARY" ,
105
105
)
106
+ mul_mat_q : Optional [bool ] = Field (
107
+ default = None ,
108
+ description = "TEMPORARY" ,
109
+ )
106
110
107
111
108
112
class ErrorResponse (TypedDict ):
You can’t perform that action at this time.
0 commit comments