Disable logits_all in llamacpp_HF (makes processing 3x faster)
This commit is contained in:
parent
5c3eb22ce6
commit
af3d25a503
5 changed files with 5 additions and 1 deletion
|
@@ -87,6 +87,7 @@ def list_model_elements():
|
|||
'alpha_value',
|
||||
'rope_freq_base',
|
||||
'numa',
|
||||
'logits_all',
|
||||
]
|
||||
if is_torch_xpu_available():
|
||||
for i in range(torch.xpu.device_count()):
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue