Pipeline

Pipeline

import requests

# Pipeline endpoint: processes a document with the pipeline identified below.
url = "https://platform.reducto.ai/pipeline"

payload = {
    # Document to process: a publicly available URL, a presigned S3 URL, or a
    # reducto:// URL obtained from the /upload endpoint.
    "document_url": "<string>",
    # ID of the pipeline to use for the document.
    "pipeline_id": "<string>",
}
headers = {
    # Bearer authentication: replace <token> with your auth token.
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json",
}

# Requests applies no timeout by default, so a stalled connection would block
# this script forever. The tuple is (connect, read) in seconds.
# NOTE(review): tune the read timeout to how long your pipeline usually runs.
response = requests.post(url, json=payload, headers=headers, timeout=(10, 300))

# Print the raw response body (JSON on success).
print(response.text)

{
  "job_id": "<string>",
  "usage": {
    "num_pages": 123,
    "credits": 123
  },
  "result": {
    "parse": {
      "job_id": "<string>",
      "duration": 123,
      "usage": {
        "num_pages": 123,
        "credits": 123
      },
      "result": {
        "type": "<string>",
        "chunks": [
          {
            "content": "<string>",
            "embed": "<string>",
            "enriched": "<string>",
            "blocks": [
              {
                "type": "Header",
                "bbox": {
                  "left": 123,
                  "top": 123,
                  "width": 123,
                  "height": 123,
                  "page": 123,
                  "original_page": 123
                },
                "content": "<string>",
                "image_url": "<string>",
                "confidence": "low",
                "granular_confidence": {
                  "extract_confidence": 123,
                  "parse_confidence": 123
                }
              }
            ],
            "enrichment_success": false
          }
        ],
        "ocr": {
          "words": [
            {
              "text": "<string>",
              "bbox": {
                "left": 123,
                "top": 123,
                "width": 123,
                "height": 123,
                "page": 123,
                "original_page": 123
              },
              "confidence": 123,
              "chunk_index": 123
            }
          ],
          "lines": [
            {
              "text": "<string>",
              "bbox": {
                "left": 123,
                "top": 123,
                "width": 123,
                "height": 123,
                "page": 123,
                "original_page": 123
              },
              "confidence": 123,
              "chunk_index": 123
            }
          ]
        },
        "custom": null
      },
      "pdf_url": "<string>",
      "studio_link": "<string>"
    },
    "extract": [
      {
        "split_name": "<string>",
        "page_range": [
          123
        ],
        "result": {
          "usage": {
            "num_pages": 123,
            "num_fields": 123,
            "credits": 123
          },
          "result": [
            "<unknown>"
          ],
          "citations": [
            "<unknown>"
          ],
          "job_id": "<string>",
          "studio_link": "<string>"
        },
        "partition": "<string>"
      }
    ],
    "split": {
      "usage": {
        "num_pages": 123,
        "credits": 123
      },
      "result": {
        "section_mapping": {},
        "splits": [
          {
            "name": "<string>",
            "pages": [
              123
            ],
            "conf": "low",
            "partitions": [
              {
                "name": "<string>",
                "pages": [
                  123
                ],
                "conf": "low"
              }
            ]
          }
        ]
      }
    },
    "edit": {
      "document_url": "<string>",
      "form_schema": [
        {
          "bbox": {
            "left": 123,
            "top": 123,
            "width": 123,
            "height": 123,
            "page": 123,
            "original_page": 123
          },
          "description": "<string>",
          "type": "text",
          "fill": true,
          "value": "<string>"
        }
      ]
    }
  }
}

POST

pipeline

Pipeline

import requests

# Pipeline endpoint: processes a document with the pipeline identified below.
url = "https://platform.reducto.ai/pipeline"

payload = {
    # Document to process: a publicly available URL, a presigned S3 URL, or a
    # reducto:// URL obtained from the /upload endpoint.
    "document_url": "<string>",
    # ID of the pipeline to use for the document.
    "pipeline_id": "<string>",
}
headers = {
    # Bearer authentication: replace <token> with your auth token.
    "Authorization": "Bearer <token>",
    "Content-Type": "application/json",
}

# Requests applies no timeout by default, so a stalled connection would block
# this script forever. The tuple is (connect, read) in seconds.
# NOTE(review): tune the read timeout to how long your pipeline usually runs.
response = requests.post(url, json=payload, headers=headers, timeout=(10, 300))

# Print the raw response body (JSON on success).
print(response.text)

{
  "job_id": "<string>",
  "usage": {
    "num_pages": 123,
    "credits": 123
  },
  "result": {
    "parse": {
      "job_id": "<string>",
      "duration": 123,
      "usage": {
        "num_pages": 123,
        "credits": 123
      },
      "result": {
        "type": "<string>",
        "chunks": [
          {
            "content": "<string>",
            "embed": "<string>",
            "enriched": "<string>",
            "blocks": [
              {
                "type": "Header",
                "bbox": {
                  "left": 123,
                  "top": 123,
                  "width": 123,
                  "height": 123,
                  "page": 123,
                  "original_page": 123
                },
                "content": "<string>",
                "image_url": "<string>",
                "confidence": "low",
                "granular_confidence": {
                  "extract_confidence": 123,
                  "parse_confidence": 123
                }
              }
            ],
            "enrichment_success": false
          }
        ],
        "ocr": {
          "words": [
            {
              "text": "<string>",
              "bbox": {
                "left": 123,
                "top": 123,
                "width": 123,
                "height": 123,
                "page": 123,
                "original_page": 123
              },
              "confidence": 123,
              "chunk_index": 123
            }
          ],
          "lines": [
            {
              "text": "<string>",
              "bbox": {
                "left": 123,
                "top": 123,
                "width": 123,
                "height": 123,
                "page": 123,
                "original_page": 123
              },
              "confidence": 123,
              "chunk_index": 123
            }
          ]
        },
        "custom": null
      },
      "pdf_url": "<string>",
      "studio_link": "<string>"
    },
    "extract": [
      {
        "split_name": "<string>",
        "page_range": [
          123
        ],
        "result": {
          "usage": {
            "num_pages": 123,
            "num_fields": 123,
            "credits": 123
          },
          "result": [
            "<unknown>"
          ],
          "citations": [
            "<unknown>"
          ],
          "job_id": "<string>",
          "studio_link": "<string>"
        },
        "partition": "<string>"
      }
    ],
    "split": {
      "usage": {
        "num_pages": 123,
        "credits": 123
      },
      "result": {
        "section_mapping": {},
        "splits": [
          {
            "name": "<string>",
            "pages": [
              123
            ],
            "conf": "low",
            "partitions": [
              {
                "name": "<string>",
                "pages": [
                  123
                ],
                "conf": "low"
              }
            ]
          }
        ]
      }
    },
    "edit": {
      "document_url": "<string>",
      "form_schema": [
        {
          "bbox": {
            "left": 123,
            "top": 123,
            "width": 123,
            "height": 123,
            "page": 123,
            "original_page": 123
          },
          "description": "<string>",
          "type": "text",
          "fill": true,
          "value": "<string>"
        }
      ]
    }
  }
}

Authorizations

Authorization

string

header

required

Bearer authentication header of the form Bearer <token>, where <token> is your auth token.

Body

application/json

document_url

required

The URL of the document to be processed. You can provide one of the following: (1) a publicly available URL; (2) a presigned S3 URL; or (3) a reducto://-prefixed URL obtained from the /upload endpoint after directly uploading a document.

pipeline_id

string

required

The ID of the pipeline to use for the document.

Response

Successful Response

job_id

string

required

usage

ParseUsage · object

required

Show child attributes

result

PipelineResult · object

required

Show child attributes

Edit Async · Pipeline Async

⌘I

Document Processing

Job Management

Utilities

Authorizations

Body

Response