Skip to content

Commit

Permalink
[TRTLLM] always setting request output length (#1258)
Browse files: browse the repository at this point in the history
  • Loading branch information
Qing Lan authored Nov 3, 2023
1 parent bac045d commit 1d51b1f
Showing 1 changed file with 2 additions and 2 deletions.
Original file line number | Diff line number | Diff line change
Expand Up @@ -38,8 +38,8 @@ def reset(self):
super().reset()

def translate_triton_params(self, parameters):
- if "max_new_tokens" in parameters.keys():
- parameters["request_output_len"] = parameters.pop("max_new_tokens")
+ parameters["max_new_tokens"] = parameters.get("max_new_tokens", 128)
+ parameters["request_output_len"] = parameters.pop("max_new_tokens")
if "top_k" in parameters.keys():
parameters["runtime_top_k"] = parameters.pop("top_k")
if "top_p" in parameters.keys():
Expand Down

0 comments on commit 1d51b1f

Please sign in to comment.