Add alpha_value/compress_pos_emb to ExLlama-v2
This commit is contained in:
parent
90fca6a77d
commit
18e6b275f3
3 changed files with 10 additions and 0 deletions
|
@@ -45,11 +45,15 @@ loaders_and_params = OrderedDict({
|
|||
'ExLlamav2': [
|
||||
'gpu_split',
|
||||
'max_seq_len',
|
||||
'alpha_value',
|
||||
'compress_pos_emb',
|
||||
],
|
||||
'ExLlamav2_HF': [
|
||||
'gpu_split',
|
||||
'max_seq_len',
|
||||
'cfg_cache',
|
||||
'alpha_value',
|
||||
'compress_pos_emb',
|
||||
],
|
||||
'AutoGPTQ': [
|
||||
'triton',
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue