Split - Reducto API

Split

import requests

# Example: POST a document to the Split endpoint and print the raw response.
url = "https://platform.reducto.ai/split"

# JSON request body. Values written as "<string>" are placeholders that must
# be replaced with real values before the request is sent.
payload = {
    "options": {
        "ocr_mode": "standard",
        "extraction_mode": "ocr",
        "chunking": {"chunk_mode": "variable"},
        "table_summary": {"enabled": False},
        "figure_summary": {
            "enabled": False,
            "override": False
        },
        "filter_blocks": [],
        "force_url_result": False
    },
    "advanced_options": {
        "ocr_system": "highres",
        "table_output_format": "html",
        "merge_tables": False,
        "continue_hierarchy": True,
        "keep_line_breaks": False,
        "page_range": {},
        "large_table_chunking": {
            "enabled": True,
            "size": 50
        },
        "spreadsheet_table_clustering": "default",
        "add_page_markers": False,
        "remove_text_formatting": False,
        "return_ocr_data": False,
        "filter_line_numbers": False,
        "read_comments": False,
        "persist_results": False,
        "exclude_hidden_sheets": False,
        "exclude_hidden_rows_cols": False,
        "enable_change_tracking": False
    },
    "experimental_options": {
        "enrich": {
            "enabled": False,
            "mode": "standard"
        },
        "native_office_conversion": False,
        "enable_checkboxes": False,
        "enable_equations": False,
        "rotate_pages": True,
        "rotate_figures": False,
        "enable_scripts": False,
        "return_figure_images": False,
        "return_table_images": False,
        "layout_model": "default",
        "embed_text_metadata_pdf": False,
        "danger_filter_wide_boxes": False
    },
    "document_url": "<string>",
    "priority": True,
    # One entry per section to look for in the document.
    "split_description": [
        {
            "name": "<string>",
            "description": "<string>",
            "partition_key": "<string>"
        }
    ],
    "split_rules": "Split the document into the applicable sections. Sections may only overlap at their first and last page if at all."
}
headers = {
    # Bearer authentication: replace <token> with your auth token.
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# Always pass a timeout: without one, requests waits indefinitely if the
# server stops responding. The tuple is (connect, read) in seconds; the
# values are illustrative -- raise the read timeout for large documents.
response = requests.post(
    url,
    json=payload,
    headers=headers,
    timeout=(10, 300),
)

# Print the raw response body (JSON text on success).
print(response.text)

{
  "usage": {
    "num_pages": 123,
    "credits": 123
  },
  "result": {
    "section_mapping": {},
    "splits": [
      {
        "name": "<string>",
        "pages": [
          123
        ],
        "conf": "low",
        "partitions": [
          {
            "name": "<string>",
            "pages": [
              123
            ],
            "conf": "low"
          }
        ]
      }
    ]
  }
}

POST

split

Split

import requests

# Example: POST a document to the Split endpoint and print the raw response.
url = "https://platform.reducto.ai/split"

# JSON request body. Values written as "<string>" are placeholders that must
# be replaced with real values before the request is sent.
payload = {
    "options": {
        "ocr_mode": "standard",
        "extraction_mode": "ocr",
        "chunking": {"chunk_mode": "variable"},
        "table_summary": {"enabled": False},
        "figure_summary": {
            "enabled": False,
            "override": False
        },
        "filter_blocks": [],
        "force_url_result": False
    },
    "advanced_options": {
        "ocr_system": "highres",
        "table_output_format": "html",
        "merge_tables": False,
        "continue_hierarchy": True,
        "keep_line_breaks": False,
        "page_range": {},
        "large_table_chunking": {
            "enabled": True,
            "size": 50
        },
        "spreadsheet_table_clustering": "default",
        "add_page_markers": False,
        "remove_text_formatting": False,
        "return_ocr_data": False,
        "filter_line_numbers": False,
        "read_comments": False,
        "persist_results": False,
        "exclude_hidden_sheets": False,
        "exclude_hidden_rows_cols": False,
        "enable_change_tracking": False
    },
    "experimental_options": {
        "enrich": {
            "enabled": False,
            "mode": "standard"
        },
        "native_office_conversion": False,
        "enable_checkboxes": False,
        "enable_equations": False,
        "rotate_pages": True,
        "rotate_figures": False,
        "enable_scripts": False,
        "return_figure_images": False,
        "return_table_images": False,
        "layout_model": "default",
        "embed_text_metadata_pdf": False,
        "danger_filter_wide_boxes": False
    },
    "document_url": "<string>",
    "priority": True,
    # One entry per section to look for in the document.
    "split_description": [
        {
            "name": "<string>",
            "description": "<string>",
            "partition_key": "<string>"
        }
    ],
    "split_rules": "Split the document into the applicable sections. Sections may only overlap at their first and last page if at all."
}
headers = {
    # Bearer authentication: replace <token> with your auth token.
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json"
}

# Always pass a timeout: without one, requests waits indefinitely if the
# server stops responding. The tuple is (connect, read) in seconds; the
# values are illustrative -- raise the read timeout for large documents.
response = requests.post(
    url,
    json=payload,
    headers=headers,
    timeout=(10, 300),
)

# Print the raw response body (JSON text on success).
print(response.text)

{
  "usage": {
    "num_pages": 123,
    "credits": 123
  },
  "result": {
    "section_mapping": {},
    "splits": [
      {
        "name": "<string>",
        "pages": [
          123
        ],
        "conf": "low",
        "partitions": [
          {
            "name": "<string>",
            "pages": [
              123
            ],
            "conf": "low"
          }
        ]
      }
    ]
  }
}

Authorizations

Authorization

string

header

required

Bearer authentication header of the form Bearer <token>, where <token> is your auth token.

Body

application/json

Response

200

application/json

Successful Response

The response is of type object.

Split Async

API Reference

Authorizations

Body

Response