from retab import Retab
# Construct the SDK client with no explicit arguments.
# NOTE(review): presumably credentials are picked up from the environment
# (e.g. an API-key variable) -- confirm against the Retab SDK docs.
client = Retab()

# Split a multi-page document into sections based on categories.
# Each category is a dict with a short "name" and a natural-language
# "description" of what belongs in that category.
result = client.documents.split(
    document="invoice_batch.pdf",
    model="gemini-2.5-flash",
    categories=[
        {"name": "invoice", "description": "Invoice documents with billing information"},
        {"name": "receipt", "description": "Receipt documents for payments"},
        {"name": "contract", "description": "Legal contract documents"},
    ],
)

# Access split results: print one line per detected section, giving its
# category name and the page range it covers.
for split in result.splits:
    print(f"{split.name}: pages {split.start_page}-{split.end_page}")

# Example output (the same category may appear more than once when the
# batch contains several documents of that kind):
# invoice: pages 1-3
# receipt: pages 4-5
# invoice: pages 6-8
# NOTE(review): the example suggests 1-based, inclusive page ranges --
# confirm against the API reference.