@@ -69,6 +69,9 @@ def __init__(
69
69
vocab_only : bool = False ,
70
70
use_mmap : bool = True ,
71
71
use_mlock : bool = False ,
72
+ check_tensors : bool = False ,
73
+ use_extra_bufts : bool = False ,
74
+ no_host : bool = False ,
72
75
kv_overrides : Optional [Dict [str , Union [bool , int , float , str ]]] = None ,
73
76
# Context Params
74
77
seed : int = llama_cpp .LLAMA_DEFAULT_SEED ,
@@ -156,6 +159,9 @@ def __init__(
156
159
vocab_only: Only load the vocabulary no weights.
157
160
use_mmap: Use mmap if possible.
158
161
use_mlock: Force the system to keep the model in RAM.
162
+ check_tensors: Validate model tensor data.
163
+ use_extra_bufts: Use extra buffer types (used for weight repacking).
164
+ no_host: Bypass host buffer, allowing extra buffers to be used.
159
165
kv_overrides: Key-value overrides for the model.
160
166
seed: RNG seed, -1 for random
161
167
n_ctx: Text context, 0 = from model
@@ -248,6 +254,9 @@ def __init__(
248
254
self .model_params .vocab_only = vocab_only
249
255
self .model_params .use_mmap = use_mmap if lora_path is None else False
250
256
self .model_params .use_mlock = use_mlock
257
+ self .model_params .check_tensors = check_tensors
258
+ self .model_params .use_extra_bufts = use_extra_bufts
259
+ self .model_params .no_host = no_host
251
260
252
261
# kv_overrides is the original python dict
253
262
self .kv_overrides = kv_overrides
@@ -2205,6 +2214,9 @@ def __getstate__(self):
2205
2214
vocab_only = self .model_params .vocab_only ,
2206
2215
use_mmap = self .model_params .use_mmap ,
2207
2216
use_mlock = self .model_params .use_mlock ,
2217
+ check_tensors = self .model_params .check_tensors ,
2218
+ use_extra_bufts = self .model_params .use_extra_bufts ,
2219
+ no_host = self .model_params .no_host ,
2208
2220
kv_overrides = self .kv_overrides ,
2209
2221
# Context Params
2210
2222
seed = self ._seed ,
0 commit comments