Bump llama-cpp-python to 0.2.24 (#5001)
This commit is contained in:
parent
83cf1a6b67
commit
0a299d5959
15 changed files with 104 additions and 96 deletions
|
@@ -86,6 +86,7 @@ class LlamaCppModel:
|
|||
'rope_freq_base': RoPE.get_rope_freq_base(shared.args.alpha_value, shared.args.rope_freq_base),
|
||||
'tensor_split': tensor_split_list,
|
||||
'rope_freq_scale': 1.0 / shared.args.compress_pos_emb,
|
||||
'offload_kqv': not shared.args.no_offload_kqv
|
||||
}
|
||||
|
||||
result.model = Llama(**params)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue