We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7613d23, commit 66d5cdd (Copy full SHA for 66d5cdd)
llama_cpp/server/model.py
@@ -223,6 +223,7 @@ def load_llama_from_model_settings(settings: ModelSettings) -> llama_cpp.Llama:
 **kwargs,
 # Model Params
 n_gpu_layers=settings.n_gpu_layers,
+split_mode=settings.split_mode,
 main_gpu=settings.main_gpu,
 tensor_split=settings.tensor_split,
 vocab_only=settings.vocab_only,
0 commit comments