Add cache_8bit option
This commit is contained in:
parent
42f816312d
commit
c0655475ae
7 changed files with 32 additions and 5 deletions
|
@ -41,6 +41,8 @@ loaders_and_params = OrderedDict({
|
|||
'gpu_split',
|
||||
'max_seq_len',
|
||||
'cfg_cache',
|
||||
'no_flash_attn',
|
||||
'cache_8bit',
|
||||
'alpha_value',
|
||||
'compress_pos_emb',
|
||||
'use_fast',
|
||||
|
@ -56,6 +58,8 @@ loaders_and_params = OrderedDict({
|
|||
'ExLlamav2': [
|
||||
'gpu_split',
|
||||
'max_seq_len',
|
||||
'no_flash_attn',
|
||||
'cache_8bit',
|
||||
'alpha_value',
|
||||
'compress_pos_emb',
|
||||
],
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue