We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 08c87be, commit 7bf4dca (Copy full SHA for 7bf4dca)
src/triton_cli/templates/llmapi/1/model.py
@@ -142,6 +142,9 @@ def _get_sampling_config_from_request(self, request):
142
None if kwargs["top_p"] is None or kwargs["top_p"] <= 0 else kwargs["top_p"]
143
)
144
145
+ # Remove None values
146
+ kwargs = {k: v for k, v in kwargs.items() if v is not None}
147
+
148
return kwargs
149
150
@classmethod
@@ -244,6 +247,7 @@ def _auto_complete_inputs_and_outputs(auto_complete_model_config):
244
247
"name": "max_tokens",
245
248
"data_type": "TYPE_INT32",
246
249
"dims": [1],
250
+ "optional": True,
251
},
252
{
253
"name": "stop",
0 commit comments