AutoAWQ: initial support (#3999)

This commit is contained in:
cal066 2023-10-05 16:19:18 +00:00 committed by GitHub
parent 3f56151f03
commit cc632c3f33
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
8 changed files with 75 additions and 3 deletions

View file

@@ -129,6 +129,16 @@ loaders_and_params = OrderedDict({
'model_type',
'no_mmap',
'mlock'
],
'AutoAWQ': [
'cpu_memory',
'gpu_memory',
'auto_devices',
'max_seq_len',
'n_batch',
'no_inject_fused_attention',
'trust_remote_code',
'use_fast',
]
})
@@ -365,7 +375,40 @@ loaders_samplers = {
'top_k',
'repetition_penalty',
'repetition_penalty_range',
}
},
'AutoAWQ': {
'temperature',
'top_p',
'top_k',
'typical_p',
'epsilon_cutoff',
'eta_cutoff',
'tfs',
'top_a',
'repetition_penalty',
'repetition_penalty_range',
'encoder_repetition_penalty',
'no_repeat_ngram_size',
'min_length',
'seed',
'do_sample',
'penalty_alpha',
'num_beams',
'length_penalty',
'early_stopping',
'mirostat_mode',
'mirostat_tau',
'mirostat_eta',
'grammar_file_row',
'grammar_string',
'guidance_scale',
'negative_prompt',
'ban_eos_token',
'custom_token_bans',
'add_bos_token',
'skip_special_tokens',
'auto_max_new_tokens',
},
}
loaders_model_types = {