Parameters: change max_new_tokens & repetition_penalty_range defaults (#4842)

This commit is contained in:
oobabooga 2023-12-07 20:04:52 -03:00 committed by GitHub
parent e16e5997ef
commit 2c5a1e67f9
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
5 changed files with 5 additions and 5 deletions

View file

@@ -236,7 +236,7 @@ def chat_completions_common(body: dict, is_legacy: bool = False, stream=False) -
max_tokens = generate_params['max_new_tokens']
if max_tokens in [None, 0]:
- generate_params['max_new_tokens'] = 200
+ generate_params['max_new_tokens'] = 512
generate_params['auto_max_new_tokens'] = True
requested_model = generate_params.pop('model')