Add --pin-weight parameter for FlexGen
This commit is contained in:
parent
05e703b4a4
commit
ed8b35efd2
2 changed files with 12 additions and 1 deletion
|
@@ -58,7 +58,7 @@ def load_model(model_name):
|
|||
shared.args.percent[0], shared.args.percent[1],
|
||||
shared.args.percent[2], shared.args.percent[3],
|
||||
shared.args.percent[4], shared.args.percent[5],
|
||||
overlap=True, sep_layer=True, pin_weight=True,
|
||||
overlap=True, sep_layer=True, pin_weight=shared.args.pin_weight,
|
||||
cpu_cache_compute=False, attn_sparsity=1.0,
|
||||
compress_weight=shared.args.compress_weight,
|
||||
comp_weight_config=CompressionConfig(
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue