Add alpha_value/compress_pos_emb to ExLlama-v2

This commit is contained in:
oobabooga 2023-09-12 15:02:47 -07:00
parent 90fca6a77d
commit 18e6b275f3
3 changed files with 10 additions and 0 deletions

View file

@@ -45,11 +45,15 @@ loaders_and_params = OrderedDict({
'ExLlamav2': [
'gpu_split',
'max_seq_len',
'alpha_value',
'compress_pos_emb',
],
'ExLlamav2_HF': [
'gpu_split',
'max_seq_len',
'cfg_cache',
'alpha_value',
'compress_pos_emb',
],
'AutoGPTQ': [
'triton',