Add ExLlamaV2 and ExLlamav2_HF loaders (#3881)

This commit is contained in:
oobabooga 2023-09-12 14:33:07 -03:00 committed by GitHub
parent a821928877
commit c2a309f56e
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
9 changed files with 295 additions and 5 deletions

View file

@ -42,6 +42,15 @@ loaders_and_params = OrderedDict({
'compress_pos_emb',
'exllama_info',
],
'ExLlamav2': [
'gpu_split',
'max_seq_len',
],
'ExLlamav2_HF': [
'gpu_split',
'max_seq_len',
'cfg_cache',
],
'AutoGPTQ': [
'triton',
'no_inject_fused_attention',
@ -180,6 +189,42 @@ loaders_samplers = {
'ban_eos_token',
'auto_max_new_tokens',
},
'ExLlamav2': {
'temperature',
'top_p',
'top_k',
'repetition_penalty',
'repetition_penalty_range',
'seed',
'ban_eos_token',
'auto_max_new_tokens',
},
'ExLlamav2_HF': {
'temperature',
'top_p',
'top_k',
'typical_p',
'epsilon_cutoff',
'eta_cutoff',
'tfs',
'top_a',
'repetition_penalty',
'repetition_penalty_range',
'encoder_repetition_penalty',
'no_repeat_ngram_size',
'min_length',
'seed',
'do_sample',
'mirostat_mode',
'mirostat_tau',
'mirostat_eta',
'guidance_scale',
'negative_prompt',
'ban_eos_token',
'add_bos_token',
'skip_special_tokens',
'auto_max_new_tokens',
},
'AutoGPTQ': {
'temperature',
'top_p',