We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent f7d6ece, commit 8d7ea9b (Copy full SHA for 8d7ea9b)
chat.go
@@ -320,6 +320,10 @@ type ChatCompletionRequest struct {
320
ChatTemplateKwargs map[string]any `json:"chat_template_kwargs,omitempty"`
321
// Specifies the latency tier to use for processing the request.
322
ServiceTier ServiceTier `json:"service_tier,omitempty"`
323
+ // Verbosity determines how many output tokens are generated.
324
+ // Lowering the number of tokens reduces overall latency.
325
+ // It can be set to "low", "medium", or "high".
326
+ Verbosity string `json:"verbosity,omitempty"`
327
// Embedded struct for non-OpenAI extensions
328
ChatCompletionRequestExtensions
329
}
0 commit comments