ExLlama with long context (#2875)

2023-06-25 22:49:26 -03:00 · 2023-06-25 22:49:26 -03:00 · c52290de50
commit c52290de50
parent 9290c6236f
14 changed files with 22 additions and 25 deletions
--- a/models/config.yaml
+++ b/models/config.yaml
@@ -104,12 +104,8 @@ llama-65b-gptq-3bit:
  mode: 'instruct'
  instruction_template: 'StableLM'
  truncation_length: 4096
-  chat_prompt_size: 4096
-  chat_prompt_size_max: 4096
 .*stablelm-base:
  truncation_length: 4096
-  chat_prompt_size: 4096
-  chat_prompt_size_max: 4096
 .*wizardlm:
  mode: 'instruct'
  model_type: 'llama'
@@ -237,8 +233,6 @@ TheBloke_WizardLM-30B-GPTQ:
  instruction_template: 'Minotaur'
 .*minotaur-15b:
  truncation_length: 8192
-  chat_prompt_size: 8192
-  chat_prompt_size_max: 8192
 .*orca_mini:
  mode: 'instruct'
  instruction_template: 'Orca Mini'