Partition Document

# Example request: submit a document to the partition endpoint as
# multipart/form-data. Replace <token> with your auth token and example-file
# with the path of the file to upload; <string> and 123 are placeholder values.
#
# The options JSON is passed with --form-string rather than --form: --form
# treats an unquoted ';' in a value as the start of a ';type=' / ';filename='
# modifier, so the ';' inside "model_selection" would cut the JSON short.
curl --request POST \
  --url https://api.aryn.cloud/v1/document/partition \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: multipart/form-data' \
  --form file='@example-file' \
  --form 'file_url=<string>' \
  --form-string 'options={
  "selected_pages": [
    123
  ],
  "extract_images": false,
  "image_extraction_options": {
    "associate_captions": false,
    "extract_image_format": "ppm"
  },
  "property_extraction_options": {
    "schema": [
      {
        "name": "<string>",
        "type": {
          "type": "int",
          "description": "<string>",
          "examples": "<array>",
          "choices": [
            "<string>"
          ],
          "item_type": {}
        }
      }
    ],
    "voting": false,
    "suggest_properties": false,
    "suggest_properties_instructions": "<string>"
  },
  "table_extraction_options": {
    "include_additional_text": true,
    "model_selection": "pixels > 500 -> deformable_detr; table_transformer"
  },
  "summarize_images": false,
  "pipeline": "standard",
  "text_mode": "auto",
  "table_mode": "standard",
  "text_extraction_options": {
    "ocr_text_mode": "vision",
    "remove_line_breaks": true
  },
  "ocr_language": "english",
  "threshold": "auto",
  "chunking_options": {
    "strategy": "context_rich",
    "tokenizer": "openai_tokenizer",
    "tokenizer_options": {
      "model_name": "text-embedding-3-small"
    },
    "max_tokens": 123,
    "merge_across_pages": true
  },
  "output_format": "json",
  "output_label_options": {
    "title_candidate_elements": [
      "<string>"
    ],
    "promote_title": false,
    "orientation_correction": false
  },
  "markdown_options": {
    "include_pagenum": false,
    "include_headers": false,
    "include_footers": false
  },
  "extract_table_structure": true,
  "use_ocr": true,
  "extract_image_format": "ppm"
}'

{
  "status": [
    "<string>"
  ],
  "status_code": 123,
  "elements": [
    {
      "type": "<string>",
      "bbox": [
        123
      ],
      "properties": {},
      "text_representation": "<string>",
      "binary_representation": "<string>"
    }
  ],
  "markdown": "<string>",
  "error": "<string>"
}

POST /document/partition

Partition Document

# Example request: submit a document to the partition endpoint as
# multipart/form-data. Replace <token> with your auth token and example-file
# with the path of the file to upload; <string> and 123 are placeholder values.
#
# The options JSON is passed with --form-string rather than --form: --form
# treats an unquoted ';' in a value as the start of a ';type=' / ';filename='
# modifier, so the ';' inside "model_selection" would cut the JSON short.
curl --request POST \
  --url https://api.aryn.cloud/v1/document/partition \
  --header 'Authorization: Bearer <token>' \
  --header 'Content-Type: multipart/form-data' \
  --form file='@example-file' \
  --form 'file_url=<string>' \
  --form-string 'options={
  "selected_pages": [
    123
  ],
  "extract_images": false,
  "image_extraction_options": {
    "associate_captions": false,
    "extract_image_format": "ppm"
  },
  "property_extraction_options": {
    "schema": [
      {
        "name": "<string>",
        "type": {
          "type": "int",
          "description": "<string>",
          "examples": "<array>",
          "choices": [
            "<string>"
          ],
          "item_type": {}
        }
      }
    ],
    "voting": false,
    "suggest_properties": false,
    "suggest_properties_instructions": "<string>"
  },
  "table_extraction_options": {
    "include_additional_text": true,
    "model_selection": "pixels > 500 -> deformable_detr; table_transformer"
  },
  "summarize_images": false,
  "pipeline": "standard",
  "text_mode": "auto",
  "table_mode": "standard",
  "text_extraction_options": {
    "ocr_text_mode": "vision",
    "remove_line_breaks": true
  },
  "ocr_language": "english",
  "threshold": "auto",
  "chunking_options": {
    "strategy": "context_rich",
    "tokenizer": "openai_tokenizer",
    "tokenizer_options": {
      "model_name": "text-embedding-3-small"
    },
    "max_tokens": 123,
    "merge_across_pages": true
  },
  "output_format": "json",
  "output_label_options": {
    "title_candidate_elements": [
      "<string>"
    ],
    "promote_title": false,
    "orientation_correction": false
  },
  "markdown_options": {
    "include_pagenum": false,
    "include_headers": false,
    "include_footers": false
  },
  "extract_table_structure": true,
  "use_ocr": true,
  "extract_image_format": "ppm"
}'

{
  "status": [
    "<string>"
  ],
  "status_code": 123,
  "elements": [
    {
      "type": "<string>",
      "bbox": [
        123
      ],
      "properties": {},
      "text_representation": "<string>",
      "binary_representation": "<string>"
    }
  ],
  "markdown": "<string>",
  "error": "<string>"
}

Authorizations

Authorization

string

header

required

Bearer authentication header of the form Bearer <token>, where <token> is your auth token.

Headers

User-Agent

string | null

Body

multipart/form-data

file

file_url

string<url>

options

object

Show child attributes

Response

Successful Response

status

string[]

required

status_code

integer

required

elements

Element · object[] | null

required

Show child attributes

markdown

string | null

required

error

string | null

The error message if the partitioning is not successful.

Introduction | Submit Document for Async Partitioning

⌘I

API Documentation

DocParse

Aryn Platform

Partition Document

Authorizations

Headers

Body

Response