Skip to content

Commit

Permalink
[TRTLLM] remove max_new_tokens since backend does not recognize it (#…
Browse files Browse the repository at this point in the history
  • Loading branch information
lanking520 committed Nov 7, 2023
1 parent d0bfe7e commit 62cf874
Showing 1 changed file with 2 additions and 2 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -38,8 +38,8 @@ def reset(self):
super().reset()

def translate_triton_params(self, parameters):
- parameters["request_output_len"] = int(
- parameters.get("max_new_tokens", 128))
+ parameters["max_new_tokens"] = parameters.get("max_new_tokens", 128)
+ parameters["request_output_len"] = parameters.pop("max_new_tokens")
if "top_k" in parameters.keys():
parameters["runtime_top_k"] = parameters.pop("top_k")
if "top_p" in parameters.keys():
Expand Down

0 comments on commit 62cf874

Please sign in to comment.