# Send a PUT request to the Tensorlake datasets endpoint with a JSON body
# describing parsing, structured-extraction, page-classification and
# enrichment options plus a dataset description.
#
# Required environment variables:
#   TENSORLAKE_API_KEY  bearer token placed in the Authorization header
#   DATASET_ID          value substituted into the request URL path
#
# NOTE(review): the JSON payload below still contains template placeholders
# ("<string>", "<any>"); replace them with real values before running.

# Fail fast with a clear message rather than sending a request built from
# empty values.
: "${TENSORLAKE_API_KEY:?must be set to the API bearer token}"
: "${DATASET_ID:?must be set to the id of the target dataset}"

# --globoff stops curl from treating {} or [] in the URL as glob patterns,
# so the dataset id is sent exactly as given.
curl --request PUT \
  --globoff \
  --url "https://api.tensorlake.ai/documents/v2/datasets/${DATASET_ID}" \
  --header "Authorization: Bearer ${TENSORLAKE_API_KEY}" \
  --header 'Content-Type: application/json' \
  --data '{
"parsing_options": {
"table_output_mode": "html",
"table_parsing_format": "tsr",
"chunking_strategy": "none",
"signature_detection": false,
"remove_strikethrough_lines": false,
"skew_detection": false,
"disable_layout_detection": false,
"ignore_sections": [],
"cross_page_header_detection": false
},
"structured_extraction_options": [
{
"schema_name": "<string>",
"json_schema": "<any>",
"skip_ocr": true,
"prompt": "<string>",
"model_provider": "tensorlake",
"partition_strategy": "none",
"page_classes": [
"<string>"
]
}
],
"page_classifications": [
{
"name": "<string>",
"description": "<string>"
}
],
"enrichment_options": {
"table_summarization": false,
"table_summarization_prompt": null,
"figure_summarization": false,
"figure_summarization_prompt": null
},
"description": "This dataset contains all invoices from 2023."
}'