Revert "Add tensor split support for llama.cpp (#3171)"
This reverts commit 031fe7225e.
This commit is contained in:
parent
517d40cffe
commit
b17893a58f
6 changed files with 0 additions and 19 deletions
|
|
@ -94,12 +94,6 @@ class LlamacppHF(PreTrainedModel):
|
|||
model_file = list(path.glob('*ggml*.bin'))[0]
|
||||
|
||||
logger.info(f"llama.cpp weights detected: {model_file}\n")
|
||||
|
||||
if shared.args.tensor_split is None or shared.args.tensor_split.strip() == '':
|
||||
tensor_split_list = None
|
||||
else:
|
||||
tensor_split_list = [float(x) for x in shared.args.tensor_split.strip().split(",")]
|
||||
|
||||
params = {
|
||||
'model_path': str(model_file),
|
||||
'n_ctx': shared.args.n_ctx,
|
||||
|
|
@ -110,7 +104,6 @@ class LlamacppHF(PreTrainedModel):
|
|||
'use_mlock': shared.args.mlock,
|
||||
'low_vram': shared.args.low_vram,
|
||||
'n_gpu_layers': shared.args.n_gpu_layers,
|
||||
'tensor_split': tensor_split_list,
|
||||
'rope_freq_base': 10000 * shared.args.alpha_value ** (64/63.),
|
||||
'rope_freq_scale': 1.0 / shared.args.compress_pos_emb,
|
||||
'n_gqa': shared.args.n_gqa or None,
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue