Skip to content

Commit 8d7ea9b

Browse files
committed
add verbosity param to ChatCompletionRequest
1 parent f7d6ece commit 8d7ea9b

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

chat.go

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -320,6 +320,10 @@ type ChatCompletionRequest struct {
320320
ChatTemplateKwargs map[string]any `json:"chat_template_kwargs,omitempty"`
321321
// Specifies the latency tier to use for processing the request.
322322
ServiceTier ServiceTier `json:"service_tier,omitempty"`
323+
// Verbosity determines how many output tokens are generated.
324+
// Lowering the number of tokens reduces overall latency.
325+
// It can be set to "low", "medium", or "high".
326+
Verbosity string `json:"verbosity,omitempty"`
323327
// Embedded struct for non-OpenAI extensions
324328
ChatCompletionRequestExtensions
325329
}

0 commit comments

Comments
 (0)