{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "title": "CompleteRequest",
  "type": "object",
  "description": "LLM text completion request.",
  "properties": {
    "model": {
      "type": "string",
      "description": "The model name. See documentation for possible values."
    },
    "messages": {
      "type": "array",
      "description": "List of messages that make up the input to the completion request."
    },
    "temperature": {
      "type": "number",
      "description": "Temperature controls the amount of randomness used in response generation. A higher temperature corresponds to more randomness."
    },
    "top_p": {
      "type": "number",
      "description": "Threshold probability for nucleus sampling. A higher top-p value increases the diversity of tokens that the model considers, while a lower value results in more predictable output."
    },
    "max_tokens": {
      "type": "integer",
      "description": "The maximum number of output tokens to produce. The default value is model-dependent."
    },
    "max_output_tokens": {
      "type": "integer",
      "description": "Deprecated in favor of \"max_tokens\", which has identical behavior."
    },
    "response_format": {
      "type": "object",
      "description": "An object describing the response format configuration for structured-output mode."
    },
    "tools": {
      "type": "array",
      "description": "List of tools to be used during tool calling."
    },
    "provisioned_throughput_id": {
      "type": "string",
      "description": "The provisioned throughput ID to be used with the request."
    },
    "sf-ml-xp-inflight-prompt-action": {
      "type": "string",
      "description": "Reserved"
    },
    "sf-ml-xp-inflight-prompt-client-id": {
      "type": "string",
      "description": "Reserved"
    },
    "sf-ml-xp-inflight-prompt-public-key": {
      "type": "string",
      "description": "Reserved"
    },
    "stream": {
      "type": "boolean",
      "description": "Reserved"
    }
  }
}