Add alpha_value/compress_pos_emb to ExLlama-v2

This commit is contained in:
oobabooga 2023-09-12 15:02:47 -07:00
parent 90fca6a77d
commit 18e6b275f3
3 changed files with 10 additions and 0 deletions

View file

@@ -114,6 +114,9 @@ class Exllamav2HF(PreTrainedModel):
config = ExLlamaV2Config()
config.model_dir = pretrained_model_name_or_path
config.prepare()
config.max_seq_len = shared.args.max_seq_len
config.rope_scale = shared.args.compress_pos_emb
config.rope_alpha = shared.args.alpha_value
return Exllamav2HF(config)