Add --num_experts_per_token parameter (ExLlamav2) (#4955)

This commit is contained in:
oobabooga 2023-12-17 12:08:33 -03:00 committed by GitHub
parent 12690d3ffc
commit f1f2c4c3f4
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
7 changed files with 28 additions and 20 deletions

View file

@@ -73,6 +73,7 @@ def list_model_elements():
'disable_exllamav2',
'cfg_cache',
'no_flash_attn',
'num_experts_per_token',
'cache_8bit',
'threads',
'threads_batch',