Bump llama-cpp-python, +tensor_split by @shouyiwang, +mul_mat_q (#3610)

This commit is contained in:
oobabooga 2023-08-18 12:03:34 -03:00 committed by GitHub
parent 4b69f4f6ae
commit 7cba000421
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
8 changed files with 31 additions and 2 deletions

View file

@@ -67,11 +67,13 @@ loaders_and_params = OrderedDict({
'n_gqa',
'rms_norm_eps',
'n_gpu_layers',
'tensor_split',
'n_batch',
'threads',
'no_mmap',
'low_vram',
'mlock',
'mul_mat_q',
'llama_cpp_seed',
'alpha_value',
'compress_pos_emb',
@@ -82,11 +84,13 @@ loaders_and_params = OrderedDict({
'n_gqa',
'rms_norm_eps',
'n_gpu_layers',
'tensor_split',
'n_batch',
'threads',
'no_mmap',
'low_vram',
'mlock',
'mul_mat_q',
'alpha_value',
'compress_pos_emb',
'cpu',