Bump ExLlamaV2 to 0.0.5 (#4186)
This commit is contained in:
parent
7ffb424c7b
commit
8a98646a21
11 changed files with 16 additions and 14 deletions
|
@@ -110,7 +110,7 @@ class Exllamav2Model:
|
|||
has_leading_space = False
|
||||
for i in range(max_new_tokens):
|
||||
logits = self.model.forward(ids[:, -1:], self.cache, input_mask=None).float().cpu()
|
||||
token, _ = ExLlamaV2Sampler.sample(logits, settings, ids, random.random())
|
||||
token, _, _= ExLlamaV2Sampler.sample(logits, settings, ids, random.random(), self.tokenizer)
|
||||
ids = torch.cat([ids, token], dim=1)
|
||||
|
||||
if i == 0 and self.tokenizer.tokenizer.IdToPiece(int(token)).startswith('▁'):
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue