{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "$id": "https://raw.githubusercontent.com/api-evangelist/google-cloud-natural-language/refs/heads/main/json-schema/document-analysis.json",
  "title": "Document Analysis",
  "description": "Schema for a Google Cloud Natural Language document analysis request.",
  "type": "object",
  "required": ["document"],
  "properties": {
    "document": {
      "type": "object",
      "description": "The document to analyze. Exactly one of `content` or `gcsContentUri` must be provided as the document source.",
      "required": ["type"],
      "properties": {
        "type": {
          "type": "string",
          "enum": ["TYPE_UNSPECIFIED", "PLAIN_TEXT", "HTML"],
          "description": "The type of the document."
        },
        "content": {
          "type": "string",
          "description": "The content of the document as a string. Mutually exclusive with `gcsContentUri`."
        },
        "gcsContentUri": {
          "type": "string",
          "description": "Google Cloud Storage URI for the document content. Mutually exclusive with `content`."
        },
        "language": {
          "type": "string",
          "description": "BCP-47 language code of the document."
        }
      },
      "oneOf": [
        {
          "title": "Inline content",
          "required": ["content"]
        },
        {
          "title": "Cloud Storage content",
          "required": ["gcsContentUri"]
        }
      ]
    },
    "features": {
      "type": "object",
      "description": "The features to enable for analysis.",
      "properties": {
        "extractSyntax": {
          "type": "boolean",
          "description": "Extract syntax information."
        },
        "extractEntities": {
          "type": "boolean",
          "description": "Extract entities."
        },
        "extractDocumentSentiment": {
          "type": "boolean",
          "description": "Extract document-level sentiment."
        },
        "extractEntitySentiment": {
          "type": "boolean",
          "description": "Extract entity-level sentiment."
        },
        "classifyText": {
          "type": "boolean",
          "description": "Classify the document into categories."
        }
      }
    },
    "encodingType": {
      "type": "string",
      "enum": ["NONE", "UTF8", "UTF16", "UTF32"],
      "description": "The encoding type for calculating offsets."
    }
  }
}