diff --git a/chat.go b/chat.go index 9719f6b92..06916114e 100644 --- a/chat.go +++ b/chat.go @@ -320,6 +320,10 @@ type ChatCompletionRequest struct { ChatTemplateKwargs map[string]any `json:"chat_template_kwargs,omitempty"` // Specifies the latency tier to use for processing the request. ServiceTier ServiceTier `json:"service_tier,omitempty"` + // Verbosity determines how many output tokens are generated. + // Lowering the number of tokens reduces overall latency. + // It can be set to "low", "medium", or "high". + Verbosity string `json:"verbosity,omitempty"` // A stable identifier used to help detect users of your application that may be violating OpenAI's usage policies. // The IDs should be a string that uniquely identifies each user. // We recommend hashing their username or email address, in order to avoid sending us any identifying information.