imotai
diff --git a/llama_cpp/llama.py b/llama_cpp/llama.py
Lines changed: 1 addition & 3 deletions
diff --git a/llama_cpp/server/settings.py b/llama_cpp/server/settings.py
Lines changed: 1 addition & 1 deletion
@@ -262,9 +262,7 @@ def __init__(
 
         self.n_batch = min(n_ctx, n_batch)  # ???
         self.n_threads = n_threads or max(multiprocessing.cpu_count() // 2, 1)
-        self.n_threads_batch = n_threads_batch or max(
-            multiprocessing.cpu_count() // 2, 1
-        )
+        self.n_threads_batch = n_threads_batch or multiprocessing.cpu_count()
 
         # Context Params
         self.context_params = llama_cpp.llama_context_default_params()
 
@@ -70,7 +70,7 @@ class ModelSettings(BaseSettings):
         description="The number of threads to use.",
     )
     n_threads_batch: int = Field(
-        default=max(multiprocessing.cpu_count() // 2, 1),
+        default=max(multiprocessing.cpu_count(), 1),
         ge=0,
         description="The number of threads to use when batch processing.",
     )
Original file line number	Diff line number	Diff line change
`@@ -70,7 +70,7 @@ class ModelSettings(BaseSettings):`
`70`	`70`	`description="The number of threads to use.",`
`71`	`71`	`)`
`72`	`72`	`n_threads_batch: int = Field(`
`73`		`- default=max(multiprocessing.cpu_count() // 2, 1),`
	`73`	`+ default=max(multiprocessing.cpu_count(), 1),`
`74`	`74`	`ge=0,`
`75`	`75`	`description="The number of threads to use when batch processing.",`
`76`	`76`	`)`