@@ -295,47 +295,47 @@ def _sample_top_p_top_k(
295
295
ctx = self .ctx ,
296
296
last_tokens_data = last_n_tokens_data ,
297
297
last_tokens_size = last_n_tokens_size ,
298
- candidates = llama_cpp .ctypes .pointer (candidates ),
298
+ candidates = llama_cpp .ctypes .byref (candidates ), # type: ignore
299
299
penalty = repeat_penalty ,
300
300
)
301
301
if float (temp .value ) == 0.0 :
302
302
return llama_cpp .llama_sample_token_greedy (
303
303
ctx = self .ctx ,
304
- candidates = llama_cpp .ctypes .pointer (candidates ),
304
+ candidates = llama_cpp .ctypes .byref (candidates ), # type: ignore
305
305
)
306
306
else :
307
307
llama_cpp .llama_sample_top_k (
308
308
ctx = self .ctx ,
309
- candidates = llama_cpp .ctypes .pointer (candidates ),
309
+ candidates = llama_cpp .ctypes .byref (candidates ), # type: ignore
310
310
k = top_k ,
311
311
min_keep = llama_cpp .c_size_t (1 ),
312
312
)
313
313
llama_cpp .llama_sample_tail_free (
314
314
ctx = self .ctx ,
315
- candidates = llama_cpp .ctypes .pointer (candidates ),
315
+ candidates = llama_cpp .ctypes .byref (candidates ), # type: ignore
316
316
z = llama_cpp .c_float (1.0 ),
317
317
min_keep = llama_cpp .c_size_t (1 ),
318
318
)
319
319
llama_cpp .llama_sample_typical (
320
320
ctx = self .ctx ,
321
- candidates = llama_cpp .ctypes .pointer (candidates ),
321
+ candidates = llama_cpp .ctypes .byref (candidates ), # type: ignore
322
322
p = llama_cpp .c_float (1.0 ),
323
323
min_keep = llama_cpp .c_size_t (1 ),
324
324
)
325
325
llama_cpp .llama_sample_top_p (
326
326
ctx = self .ctx ,
327
- candidates = llama_cpp .ctypes .pointer (candidates ),
327
+ candidates = llama_cpp .ctypes .byref (candidates ), # type: ignore
328
328
p = top_p ,
329
329
min_keep = llama_cpp .c_size_t (1 ),
330
330
)
331
331
llama_cpp .llama_sample_temperature (
332
332
ctx = self .ctx ,
333
- candidates = llama_cpp .ctypes .pointer (candidates ),
333
+ candidates = llama_cpp .ctypes .byref (candidates ), # type: ignore
334
334
temp = temp ,
335
335
)
336
336
return llama_cpp .llama_sample_token (
337
337
ctx = self .ctx ,
338
- candidates = llama_cpp .ctypes .pointer (candidates ),
338
+ candidates = llama_cpp .ctypes .byref (candidates ), # type: ignore
339
339
)
340
340
341
341
def sample (
0 commit comments