> ## Documentation Index
> Fetch the complete documentation index at: https://docs.bigdata.com/llms.txt
> Use this file to discover all available pages before exploring further.

# Get document metadata

> Returns metadata for a single document by its content ID (the document id returned by List documents). Use this to check status, file_name, connector_id, tags, and timestamps. To retrieve the actual file content, use Get annotated document (structured JSON) or Get original document (original file format).



## OpenAPI

````yaml /api-rest/openapi/openapi_content_data.json get /contents/v1/documents/{content_id}
# OpenAPI specification version this document is written against; quoted so
# it is always read as a string.
openapi: '3.1.0'
info:
  title: Bigdata Content API
  version: '1.0.0'
  description: >-
    API for managing and accessing private content documents uploaded by
    users.
# Base URL that the paths in this document are resolved against.
servers:
  - url: 'https://api.bigdata.com/'
# Document-wide security requirement: the ApiKeyAuth scheme, with no scopes
# (hence the empty list).
security:
  - ApiKeyAuth: []
paths:
  # Metadata lookup for one document, addressed by its content ID.
  '/contents/v1/documents/{content_id}':
    get:
      summary: Get document metadata
      tags:
        - Documents
      description: >-
        Returns metadata for a single document by its content ID (the
        document id returned by List documents). Use this to check status,
        file_name, connector_id, tags, and timestamps. To retrieve the actual
        file content, use Get annotated document (structured JSON) or Get
        original document (original file format).
      parameters:
        - name: content_id
          in: path
          required: true
          description: >-
            Content ID of the document: a 32-character uppercase
            hexadecimal string (MD5-based identifier).
          schema:
            type: string
            # Exactly 32 characters drawn from A-F and 0-9.
            pattern: '^[A-F0-9]{32}$'
            example: 'E0618D0E9D3A960C1731A620EDE56B5C'
      responses:
        # Success: the document's metadata record.
        '200':
          description: >-
            Document metadata (id, file_name, status, connector_id, tags,
            etc.). Use Get annotated document or Get original document with
            this id to download content.
          content:
            application/json:
              schema:
                $ref: '#/components/schemas/DocumentListItem'
              # ID-like values are quoted so they can never be re-typed as
              # numbers by a YAML loader.
              example:
                id: 'E0618D0E9D3A960C1731A620EDE56B5C'
                file_name: 'Weekly summary report.eml'
                user_id: 'user_id_001'
                org_id: 'org_id_001'
                rp_collection_id: '2CBDC7DA8AE42A8A078DECC3C9FCADFB'
                raw_size: 18974
                request_origin: 'email'
                content_type: 'message/rfc822'
                status: 'completed'
                shared_with_orgs:
                  - 'org_id_001'
                created_at: '2026-02-03T08:43:02.729356Z'
                updated_at: '2026-02-03T08:43:02.729359Z'
                published_at: '2026-02-03T08:43:02.729359Z'
                connector_id: '019a9612-bfad-758c-884e-37dd8c6ad2cb'
                error_code: null
                delete_started_ts: null
                file_metadata: null
                tags:
                  - id: '019a48b4-e574-71d9-a8d9-6a5a86386847'
                    name: 'to:user@email.com'
                  - id: '019a48b4-e573-7203-945a-2e7c4c164217'
                    name: 'from:user@email.com'
        # Error responses: described in prose only, no body schema declared.
        '401':
          description: 'Unauthorized - Invalid or missing API key.'
        '403':
          description: >-
            You do not have permission to access this document (e.g. not
            shared with your organization).
        '404':
          description: 'No document found with this content_id.'
components:
  schemas:
    # Metadata record for one document. Nullable fields use JSON Schema type
    # arrays because this document declares OpenAPI 3.1.0, where the 3.0-only
    # `nullable` keyword is no longer part of the Schema Object.
    DocumentListItem:
      type: object
      description: >-
        Metadata for a single document. Returned by List documents and Get
        document. Use the id (content_id) with Get annotated document or Get
        original document to retrieve the file content.
      properties:
        id:
          type: string
          # Same format constraint as the content_id path parameter.
          pattern: '^[A-F0-9]{32}$'
          description: >-
            Content ID: unique 32-character uppercase hexadecimal identifier for
            the document. Use this when calling Get document, Get annotated
            document, or Get original document.
          example: E0618D0E9D3A960C1731A620EDE56B5C
        file_name:
          type: string
          description: Original file name of the uploaded document.
          example: Weekly summary report.eml
        user_id:
          type: string
          description: ID of the user who uploaded the document.
          example: user_id_001
        org_id:
          type: string
          description: ID of the organization the document belongs to.
          example: org_id_001
        rp_collection_id:
          type: string
          description: >-
            ID of the collection the document belongs to. This is applicable
            only for emails and attachments.
          example: 2CBDC7DA8AE42A8A078DECC3C9FCADFB
        raw_size:
          type: integer
          description: Size of the raw document in bytes.
          example: 18974
        request_origin:
          type: string
          description: >-
            Origin of the content ingestion request: how the document entered
            the platform.
          enum:
            - email
            - investment_research
            - file_upload
          example: email
        content_type:
          type: string
          description: MIME type of the document.
          example: message/rfc822
        status:
          type: string
          description: Processing status of the document.
          enum:
            - pending
            - processing
            - completed
            - failed
          example: completed
        shared_with_orgs:
          type: array
          description: List of organization IDs the document is shared with.
          items:
            type: string
          example:
            - org_id_001
        created_at:
          type: string
          format: date-time
          description: Timestamp when the document was created.
          example: '2026-02-03T08:43:02.729356Z'
        updated_at:
          type: string
          format: date-time
          description: Timestamp when the document was last updated.
          example: '2026-02-03T08:43:02.729359Z'
        published_at:
          type: string
          format: date-time
          description: >-
            Timestamp when the document was published. This is the reference
            timestamp used for search and retrieval.
          example: '2026-02-03T08:43:02.729359Z'
        connector_id:
          type: string
          format: uuid
          description: ID of the connector used to upload the document.
          example: 019a9612-bfad-758c-884e-37dd8c6ad2cb
        error_code:
          # String or null ('null' is quoted so it names the JSON Schema type
          # rather than being read as a YAML null).
          type:
            - string
            - 'null'
          description: Error code if the document processing failed.
          example: null
        delete_started_ts:
          # String or null; `format` only constrains the string case.
          type:
            - string
            - 'null'
          format: date-time
          description: Timestamp when document deletion started, if applicable.
          example: null
        file_metadata:
          # Object or null.
          type:
            - object
            - 'null'
          description: Additional metadata about the file.
          example: null
        tags:
          type: array
          description: Tags associated with the document.
          items:
            $ref: '#/components/schemas/Tag'
      required:
        - id
        - file_name
        - user_id
        - org_id
        - status
        - created_at
        - updated_at
        - published_at
    # One tag entry: an identifier plus a display name, both mandatory.
    Tag:
      type: object
      description: A tag associated with a document.
      required:
        - id
        - name
      properties:
        id:
          type: string
          description: Unique identifier for the tag.
          example: '019a48b4-e574-71d9-a8d9-6a5a86386847'
        name:
          type: string
          description: >-
            Name of the tag (e.g. `from:user@email.com` for
            email; `broker:Broker Name` for investment research).
          example: 'from:user@email.com'
  securitySchemes:
    # API-key authentication carried in the X-API-KEY request header.
    ApiKeyAuth:
      type: apiKey
      name: X-API-KEY
      in: header
      description: >-
        Your API key. Include it in every request as the X-API-KEY
        header. Create and manage keys in the Developer Platform.

````