Bump llama-cpp-python to 0.2.24 (#5001)

This commit is contained in:
oobabooga 2023-12-19 15:22:21 -03:00 committed by GitHub
parent 83cf1a6b67
commit 0a299d5959
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
15 changed files with 104 additions and 96 deletions

View file

@@ -204,6 +204,7 @@ class LlamacppHF(PreTrainedModel):
'tensor_split': tensor_split_list,
'rope_freq_scale': 1.0 / shared.args.compress_pos_emb,
'logits_all': shared.args.logits_all,
'offload_kqv': not shared.args.no_offload_kqv
}
Llama = llama_cpp_lib().Llama