From bafd90fd85d4488e5244e7025c748bd6c5f4d648 Mon Sep 17 00:00:00 2001 From: speakeasybot Date: Fri, 28 Mar 2025 19:02:07 +0000 Subject: [PATCH] ci: regenerated with OpenAPI Doc , Speakeasy CLI 1.526.0 --- .speakeasy/gen.lock | 14 +++---- .speakeasy/workflow.lock | 16 ++++---- RELEASES.md | 12 +++++- codeSamples.yaml | 4 +- .../shared/astradbconnectorconfiginput.md | 1 + .../shared/confluencesourceconnectorconfig.md | 4 +- .../confluencesourceconnectorconfiginput.md | 4 +- .../shared/jirasourceconnectorconfig.md | 6 +-- .../shared/jirasourceconnectorconfiginput.md | 6 +-- docs/models/shared/partitionparameters.md | 4 ++ .../shared/sharepointsourceconnectorconfig.md | 3 ++ .../sharepointsourceconnectorconfiginput.md | 3 ++ .../snowflakedestinationconnectorconfig.md | 4 +- ...nowflakedestinationconnectorconfiginput.md | 4 +- .../shared/snowflakesourceconnectorconfig.md | 4 +- .../snowflakesourceconnectorconfiginput.md | 4 +- gen.yaml | 2 +- pyproject.toml | 2 +- src/unstructured_client/_version.py | 8 ++-- src/unstructured_client/destinations.py | 20 +++++----- src/unstructured_client/jobs.py | 16 ++++---- .../shared/astradbconnectorconfiginput.py | 5 ++- .../shared/confluencesourceconnectorconfig.py | 13 ++++-- .../confluencesourceconnectorconfiginput.py | 14 +++++-- .../shared/createdestinationconnector.py | 4 +- .../models/shared/createsourceconnector.py | 16 ++++---- .../shared/jirasourceconnectorconfig.py | 13 +++--- .../shared/jirasourceconnectorconfiginput.py | 13 +++--- .../models/shared/partition_parameters.py | 40 +++++++++++++++++++ .../shared/sharepointsourceconnectorconfig.py | 12 +++++- .../sharepointsourceconnectorconfiginput.py | 11 ++++- .../snowflakedestinationconnectorconfig.py | 9 +++-- ...nowflakedestinationconnectorconfiginput.py | 8 ++-- .../shared/snowflakesourceconnectorconfig.py | 10 ++--- .../snowflakesourceconnectorconfiginput.py | 8 ++-- .../shared/sourceconnectorinformation.py | 12 +++--- .../shared/updatedestinationconnector.py | 4 +- .../models/shared/updatesourceconnector.py | 16 ++++---- src/unstructured_client/sources.py | 20 +++++----- src/unstructured_client/workflows.py | 24 +++++------ 40 files changed, 249 insertions(+), 144 deletions(-) diff --git a/.speakeasy/gen.lock b/.speakeasy/gen.lock index 4862a489..701bc124 100755 --- a/.speakeasy/gen.lock +++ b/.speakeasy/gen.lock @@ -1,12 +1,12 @@ lockVersion: 2.0.0 id: 8b5fa338-9106-4734-abf0-e30d67044a90 management: - docChecksum: c919f9a5fe1fffc0fe08d9ba771fdf37 - docVersion: 1.0.81 - speakeasyVersion: 1.525.1 - generationVersion: 2.562.2 - releaseVersion: 0.31.6 - configChecksum: 4c2dbab9c89a9d2312d8d54a2c3fef88 + docChecksum: 82d55672df290a1b6b3641bf1c0385a0 + docVersion: 1.1.4 + speakeasyVersion: 1.526.0 + generationVersion: 2.563.0 + releaseVersion: 0.32.0 + configChecksum: aaffd2f8109b46337a8b440562051f7a repoURL: https://github.com/Unstructured-IO/unstructured-python-client.git repoSubDirectory: . installationURL: https://github.com/Unstructured-IO/unstructured-python-client.git @@ -566,7 +566,7 @@ examples: partition: speakeasy-default-partition: requestBody: - multipart/form-data: {"chunking_strategy": "by_title", "combine_under_n_chars": null, "content_type": null, "coordinates": false, "encoding": null, "files": {"": "{\"summary\":\"File to be partitioned\",\"externalValue\":\"https://github.com/Unstructured-IO/unstructured/blob/98d3541909f64290b5efb65a226fc3ee8a7cc5ee/example-docs/layout-parser-paper.pdf\"}"}, "gz_uncompressed_content_type": null, "hi_res_model_name": null, "include_orig_elements": null, "include_page_breaks": false, "include_slide_notes": true, "max_characters": null, "multipage_sections": true, "new_after_n_chars": null, "output_format": "application/json", "overlap": 0, "overlap_all": false, "pdf_infer_table_structure": true, "similarity_threshold": null, "split_pdf_allow_failed": false, "split_pdf_cache_tmp_data": false, "split_pdf_cache_tmp_data_dir": "", "split_pdf_concurrency_level": 5, "split_pdf_page": true, "split_pdf_page_range": [1, 10], "starting_page_number": null, "strategy": "vlm", "table_ocr_agent": null, "unique_element_ids": false, "vlm_model": "gpt-4o", "vlm_model_provider": "openai", "xml_keep_tags": false} + multipart/form-data: {"chunking_strategy": "by_title", "combine_under_n_chars": null, "content_type": null, "coordinates": false, "encoding": null, "files": {"": "{\"summary\":\"File to be partitioned\",\"externalValue\":\"https://github.com/Unstructured-IO/unstructured/blob/98d3541909f64290b5efb65a226fc3ee8a7cc5ee/example-docs/layout-parser-paper.pdf\"}"}, "gz_uncompressed_content_type": null, "hi_res_model_name": null, "include_orig_elements": null, "include_page_breaks": false, "include_slide_notes": true, "max_characters": null, "multipage_sections": true, "new_after_n_chars": null, "output_format": "application/json", "overlap": 0, "overlap_all": false, "pdf_infer_table_structure": true, "pdfminer_char_margin": null, "pdfminer_line_margin": null, "pdfminer_line_overlap": null, "pdfminer_word_margin": null, "similarity_threshold": null, "split_pdf_allow_failed": false, "split_pdf_cache_tmp_data": false, "split_pdf_cache_tmp_data_dir": "", "split_pdf_concurrency_level": 5, "split_pdf_page": true, "split_pdf_page_range": [1, 10], "starting_page_number": null, "strategy": "vlm", "table_ocr_agent": null, "unique_element_ids": false, "vlm_model": "gpt-4o", "vlm_model_provider": "openai", "xml_keep_tags": false} responses: "200": application/json: [{"type": "Title", "element_id": "6aa0ff22f91bbe7e26e8e25ca8052acd", "text": "LayoutParser: A Unified Toolkit for Deep Learning Based Document Image Analysis", "metadata": {"languages": ["eng"], "page_number": 1, "filename": "layout-parser-paper.pdf", "filetype": "application/pdf"}}] diff --git a/.speakeasy/workflow.lock b/.speakeasy/workflow.lock index 00db8f67..e562784c 100644 --- a/.speakeasy/workflow.lock +++ b/.speakeasy/workflow.lock @@ -1,21 +1,21 @@ -speakeasyVersion: 1.525.1 +speakeasyVersion: 1.526.0 sources: my-source: sourceNamespace: my-source - sourceRevisionDigest: sha256:8cefa2db4e0071ffc9ae499d113126153c720616d0f065d3cfd8d0130d695c14 - sourceBlobDigest: sha256:bbe20a8c95ddaf534208edebea334f221fa91acaff2ae00525987715bd36b943 + sourceRevisionDigest: sha256:b7ee9aa59b47e0b739012e611720330b6870798eb256e44c15d0c55832dc1207 + sourceBlobDigest: sha256:19ebaffb7c44a42ce3fbdf03cf5fe0f4a68956d59d6f3239d8b6a5b16e1c07e5 tags: - latest - - speakeasy-sdk-regen-1743108088 - - 1.0.81 + - speakeasy-sdk-regen-1743188464 + - 1.1.4 targets: unstructured-python: source: my-source sourceNamespace: my-source - sourceRevisionDigest: sha256:8cefa2db4e0071ffc9ae499d113126153c720616d0f065d3cfd8d0130d695c14 - sourceBlobDigest: sha256:bbe20a8c95ddaf534208edebea334f221fa91acaff2ae00525987715bd36b943 + sourceRevisionDigest: sha256:b7ee9aa59b47e0b739012e611720330b6870798eb256e44c15d0c55832dc1207 + sourceBlobDigest: sha256:19ebaffb7c44a42ce3fbdf03cf5fe0f4a68956d59d6f3239d8b6a5b16e1c07e5 codeSamplesNamespace: my-source-code-samples - codeSamplesRevisionDigest: sha256:974e4d48d27a10c9be80ec289dc9dbf7903b32a4ac7f0c6821c8224e52b93799 + codeSamplesRevisionDigest: sha256:0696c1f0b1f0274a950cd103dd855cc721ada1716468d57138e7370f7f7e9ea4 workflow: workflowVersion: 1.0.0 speakeasyVersion: latest diff --git a/RELEASES.md b/RELEASES.md index 2ef350c1..8bec9b26 100644 --- a/RELEASES.md +++ b/RELEASES.md @@ -905,4 +905,14 @@ Based on: ### Generated - [python v0.31.6] . ### Releases -- [PyPI v0.31.6] https://pypi.org/project/unstructured-client/0.31.6 - . \ No newline at end of file +- [PyPI v0.31.6] https://pypi.org/project/unstructured-client/0.31.6 - . + +## 2025-03-28 19:00:48 +### Changes +Based on: +- OpenAPI Doc +- Speakeasy CLI 1.526.0 (2.563.0) https://github.com/speakeasy-api/speakeasy +### Generated +- [python v0.32.0] . +### Releases +- [PyPI v0.32.0] https://pypi.org/project/unstructured-client/0.32.0 - . \ No newline at end of file diff --git a/codeSamples.yaml b/codeSamples.yaml index e9e98aee..2503dd7f 100644 --- a/codeSamples.yaml +++ b/codeSamples.yaml @@ -14,7 +14,7 @@ actions: "x-codeSamples": - "lang": "python" "label": "create_destination" - "source": "from unstructured_client import UnstructuredClient\nfrom unstructured_client.models import shared\n\n\nwith UnstructuredClient() as uc_client:\n\n res = uc_client.destinations.create_destination(request={\n \"create_destination_connector\": {\n \"name\": \"\",\n \"type\": shared.DestinationConnectorType.AZURE_AI_SEARCH,\n \"config\": {\n \"collection_name\": \"\",\n \"batch_size\": 20,\n \"api_endpoint\": \"\",\n \"token\": \"\",\n },\n },\n })\n\n assert res.destination_connector_information is not None\n\n # Handle response\n print(res.destination_connector_information)" + "source": "from unstructured_client import UnstructuredClient\nfrom unstructured_client.models import shared\n\n\nwith UnstructuredClient() as uc_client:\n\n res = uc_client.destinations.create_destination(request={\n \"create_destination_connector\": {\n \"name\": \"\",\n \"type\": shared.DestinationConnectorType.AZURE_AI_SEARCH,\n \"config\": {\n \"collection_name\": \"\",\n \"batch_size\": 20,\n \"api_endpoint\": \"\",\n \"token\": \"\",\n \"flatten_metadata\": False,\n },\n },\n })\n\n assert res.destination_connector_information is not None\n\n # Handle response\n print(res.destination_connector_information)" - target: $["paths"]["/api/v1/destinations/{destination_id}"]["delete"] update: "x-codeSamples": @@ -68,7 +68,7 @@ actions: "x-codeSamples": - "lang": "python" "label": "create_source" - "source": "from unstructured_client import UnstructuredClient\nfrom unstructured_client.models import shared\n\n\nwith UnstructuredClient() as uc_client:\n\n res = uc_client.sources.create_source(request={\n \"create_source_connector\": {\n \"name\": \"\",\n \"type\": shared.SourceConnectorType.SHAREPOINT,\n \"config\": {\n \"account\": \"21158540\",\n \"role\": \"\",\n \"user\": \"Andrew_Ebert71\",\n \"password\": \"RKAX3jUtlnjWe9D\",\n \"host\": \"impractical-academics.net\",\n \"port\": 443,\n \"database\": \"\",\n \"schema_\": \"\",\n \"table_name\": \"\",\n \"batch_size\": 100,\n \"id_column\": \"\",\n },\n },\n })\n\n assert res.source_connector_information is not None\n\n # Handle response\n print(res.source_connector_information)" + "source": "from unstructured_client import UnstructuredClient\nfrom unstructured_client.models import shared\n\n\nwith UnstructuredClient() as uc_client:\n\n res = uc_client.sources.create_source(request={\n \"create_source_connector\": {\n \"name\": \"\",\n \"type\": shared.SourceConnectorType.SHAREPOINT,\n \"config\": {\n \"account\": \"21158540\",\n \"role\": \"\",\n \"user\": \"Andrew_Ebert71\",\n \"password\": \"RKAX3jUtlnjWe9D\",\n \"host\": \"impractical-academics.net\",\n \"port\": 443,\n \"database\": \"\",\n \"table_name\": \"\",\n \"batch_size\": 100,\n \"id_column\": \"\",\n },\n },\n })\n\n assert res.source_connector_information is not None\n\n # Handle response\n print(res.source_connector_information)" - target: $["paths"]["/api/v1/sources/{source_id}"]["delete"] update: "x-codeSamples": diff --git a/docs/models/shared/astradbconnectorconfiginput.md b/docs/models/shared/astradbconnectorconfiginput.md index 81181439..77d1eb54 100644 --- a/docs/models/shared/astradbconnectorconfiginput.md +++ b/docs/models/shared/astradbconnectorconfiginput.md @@ -9,4 +9,5 @@ | `collection_name` | *str* | :heavy_check_mark: | N/A | | `token` | *str* | :heavy_check_mark: | N/A | | `batch_size` | *Optional[int]* | :heavy_minus_sign: | N/A | +| `flatten_metadata` | *Optional[bool]* | :heavy_minus_sign: | N/A | | `keyspace` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/confluencesourceconnectorconfig.md b/docs/models/shared/confluencesourceconnectorconfig.md index da78a529..7eb75dca 100644 --- a/docs/models/shared/confluencesourceconnectorconfig.md +++ b/docs/models/shared/confluencesourceconnectorconfig.md @@ -8,8 +8,10 @@ | `cloud` | *bool* | :heavy_check_mark: | N/A | | `max_num_of_docs_from_each_space` | *int* | :heavy_check_mark: | N/A | | `max_num_of_spaces` | *int* | :heavy_check_mark: | N/A | -| `spaces` | *Nullable[str]* | :heavy_check_mark: | N/A | +| `spaces` | List[*str*] | :heavy_check_mark: | N/A | | `url` | *str* | :heavy_check_mark: | N/A | | `username` | *str* | :heavy_check_mark: | N/A | +| `extract_files` | *Optional[bool]* | :heavy_minus_sign: | N/A | +| `extract_images` | *Optional[bool]* | :heavy_minus_sign: | N/A | | `password` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | | `token` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/confluencesourceconnectorconfiginput.md b/docs/models/shared/confluencesourceconnectorconfiginput.md index 32862b7b..7bdd0e84 100644 --- a/docs/models/shared/confluencesourceconnectorconfiginput.md +++ b/docs/models/shared/confluencesourceconnectorconfiginput.md @@ -8,8 +8,10 @@ | `url` | *str* | :heavy_check_mark: | N/A | | `username` | *str* | :heavy_check_mark: | N/A | | `cloud` | *Optional[bool]* | :heavy_minus_sign: | N/A | +| `extract_files` | *Optional[bool]* | :heavy_minus_sign: | N/A | +| `extract_images` | *Optional[bool]* | :heavy_minus_sign: | N/A | | `max_num_of_docs_from_each_space` | *Optional[int]* | :heavy_minus_sign: | N/A | | `max_num_of_spaces` | *Optional[int]* | :heavy_minus_sign: | N/A | | `password` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | -| `spaces` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | +| `spaces` | List[*str*] | :heavy_minus_sign: | N/A | | `token` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/jirasourceconnectorconfig.md b/docs/models/shared/jirasourceconnectorconfig.md index cdf0ab36..ee46373b 100644 --- a/docs/models/shared/jirasourceconnectorconfig.md +++ b/docs/models/shared/jirasourceconnectorconfig.md @@ -7,9 +7,9 @@ | ------------------------ | ------------------------ | ------------------------ | ------------------------ | | `url` | *str* | :heavy_check_mark: | N/A | | `username` | *str* | :heavy_check_mark: | N/A | -| `boards` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | +| `boards` | List[*str*] | :heavy_minus_sign: | N/A | | `cloud` | *OptionalNullable[bool]* | :heavy_minus_sign: | N/A | -| `issues` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | +| `issues` | List[*str*] | :heavy_minus_sign: | N/A | | `password` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | -| `projects` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | +| `projects` | List[*str*] | :heavy_minus_sign: | N/A | | `token` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/jirasourceconnectorconfiginput.md b/docs/models/shared/jirasourceconnectorconfiginput.md index ba4d8e24..75b93c27 100644 --- a/docs/models/shared/jirasourceconnectorconfiginput.md +++ b/docs/models/shared/jirasourceconnectorconfiginput.md @@ -7,9 +7,9 @@ | ------------------------ | ------------------------ | ------------------------ | ------------------------ | | `url` | *str* | :heavy_check_mark: | N/A | | `username` | *str* | :heavy_check_mark: | N/A | -| `boards` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | +| `boards` | List[*str*] | :heavy_minus_sign: | N/A | | `cloud` | *OptionalNullable[bool]* | :heavy_minus_sign: | N/A | -| `issues` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | +| `issues` | List[*str*] | :heavy_minus_sign: | N/A | | `password` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | -| `projects` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | +| `projects` | List[*str*] | :heavy_minus_sign: | N/A | | `token` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/partitionparameters.md b/docs/models/shared/partitionparameters.md index a7dc92e5..e7fd8e1a 100644 --- a/docs/models/shared/partitionparameters.md +++ b/docs/models/shared/partitionparameters.md @@ -26,6 +26,10 @@ | `overlap` | *Optional[int]* | :heavy_minus_sign: | Specifies the length of a string ('tail') to be drawn from each chunk and prefixed to the next chunk as a context-preserving mechanism. By default, this only applies to split-chunks where an oversized element is divided into multiple chunks by text-splitting. Default: 0 | | | `overlap_all` | *Optional[bool]* | :heavy_minus_sign: | When `True`, apply overlap between 'normal' chunks formed from whole elements and not subject to text-splitting. Use this with caution as it entails a certain level of 'pollution' of otherwise clean semantic chunk boundaries. Default: False | | | `pdf_infer_table_structure` | *Optional[bool]* | :heavy_minus_sign: | Deprecated! Use skip_infer_table_types to opt out of table extraction for any file type. If False and strategy=hi_res, no Table Elements will be extracted from pdf files regardless of skip_infer_table_types contents. | | +| `pdfminer_char_margin` | *OptionalNullable[float]* | :heavy_minus_sign: | If two characters are closer together than this margin they are considered part of the same line. The margin is specified relative to the width of the character. | | +| `pdfminer_line_margin` | *OptionalNullable[float]* | :heavy_minus_sign: | If two lines are close together they are considered to be part of the same paragraph. The margin is specified relative to the height of a line. | | +| `pdfminer_line_overlap` | *OptionalNullable[float]* | :heavy_minus_sign: | If two characters have more overlap than this they are considered to be on the same line. The overlap is specified relative to the minimum height of both characters. | | +| `pdfminer_word_margin` | *OptionalNullable[float]* | :heavy_minus_sign: | If two characters on the same line are further apart than this margin then they are considered to be two separate words, and an intermediate space will be added for readability. The margin is specified relative to the width of the character. | | | `similarity_threshold` | *OptionalNullable[float]* | :heavy_minus_sign: | A value between 0.0 and 1.0 describing the minimum similarity two elements must have to be included in the same chunk. Note that similar elements may be separated to meet chunk-size criteria; this value can only guarantees that two elements with similarity below the threshold will appear in separate chunks. | | | `skip_infer_table_types` | List[*str*] | :heavy_minus_sign: | The document types that you want to skip table extraction with. Default: [] | | | `split_pdf_allow_failed` | *Optional[bool]* | :heavy_minus_sign: | When `split_pdf_page` is set to `True`, this parameter defines the behavior when some of the parallel requests fail. By default `split_pdf_allow_failed` is set to `False` and any failed request send to the API will make the whole process break and raise an Exception. If `split_pdf_allow_failed` is set to `True`, the errors encountered while sending parallel requests will not break the processing - the resuling list of Elements will miss the data from errored pages. | | diff --git a/docs/models/shared/sharepointsourceconnectorconfig.md b/docs/models/shared/sharepointsourceconnectorconfig.md index fdb9e7a3..493738f5 100644 --- a/docs/models/shared/sharepointsourceconnectorconfig.md +++ b/docs/models/shared/sharepointsourceconnectorconfig.md @@ -9,4 +9,7 @@ | `client_id` | *str* | :heavy_check_mark: | N/A | | `recursive` | *bool* | :heavy_check_mark: | N/A | | `site` | *str* | :heavy_check_mark: | N/A | +| `tenant` | *str* | :heavy_check_mark: | N/A | +| `user_pname` | *str* | :heavy_check_mark: | N/A | +| `authority_url` | *Optional[str]* | :heavy_minus_sign: | N/A | | `path` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/sharepointsourceconnectorconfiginput.md b/docs/models/shared/sharepointsourceconnectorconfiginput.md index 1f2c2e4d..b67533c8 100644 --- a/docs/models/shared/sharepointsourceconnectorconfiginput.md +++ b/docs/models/shared/sharepointsourceconnectorconfiginput.md @@ -8,5 +8,8 @@ | `client_cred` | *str* | :heavy_check_mark: | N/A | | `client_id` | *str* | :heavy_check_mark: | N/A | | `site` | *str* | :heavy_check_mark: | N/A | +| `tenant` | *str* | :heavy_check_mark: | N/A | +| `user_pname` | *str* | :heavy_check_mark: | N/A | +| `authority_url` | *Optional[str]* | :heavy_minus_sign: | N/A | | `path` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | | `recursive` | *Optional[bool]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/snowflakedestinationconnectorconfig.md b/docs/models/shared/snowflakedestinationconnectorconfig.md index b7858812..badd6de6 100644 --- a/docs/models/shared/snowflakedestinationconnectorconfig.md +++ b/docs/models/shared/snowflakedestinationconnectorconfig.md @@ -13,6 +13,6 @@ | `port` | *int* | :heavy_check_mark: | N/A | | `record_id_key` | *str* | :heavy_check_mark: | N/A | | `role` | *str* | :heavy_check_mark: | N/A | -| `schema_` | *str* | :heavy_check_mark: | N/A | | `table_name` | *str* | :heavy_check_mark: | N/A | -| `user` | *str* | :heavy_check_mark: | N/A | \ No newline at end of file +| `user` | *str* | :heavy_check_mark: | N/A | +| `schema_` | *Optional[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/snowflakedestinationconnectorconfiginput.md b/docs/models/shared/snowflakedestinationconnectorconfiginput.md index 8abc485c..99f23c57 100644 --- a/docs/models/shared/snowflakedestinationconnectorconfiginput.md +++ b/docs/models/shared/snowflakedestinationconnectorconfiginput.md @@ -12,9 +12,9 @@ | `id_column` | *str* | :heavy_check_mark: | N/A | | `password` | *str* | :heavy_check_mark: | N/A | | `role` | *str* | :heavy_check_mark: | N/A | -| `schema_` | *str* | :heavy_check_mark: | N/A | | `table_name` | *str* | :heavy_check_mark: | N/A | | `user` | *str* | :heavy_check_mark: | N/A | | `batch_size` | *Optional[int]* | :heavy_minus_sign: | N/A | | `port` | *Optional[int]* | :heavy_minus_sign: | N/A | -| `record_id_key` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file +| `record_id_key` | *OptionalNullable[str]* | :heavy_minus_sign: | N/A | +| `schema_` | *Optional[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/snowflakesourceconnectorconfig.md b/docs/models/shared/snowflakesourceconnectorconfig.md index 70f2f533..d71fc925 100644 --- a/docs/models/shared/snowflakesourceconnectorconfig.md +++ b/docs/models/shared/snowflakesourceconnectorconfig.md @@ -14,6 +14,6 @@ | `password` | *str* | :heavy_check_mark: | N/A | | `port` | *int* | :heavy_check_mark: | N/A | | `role` | *str* | :heavy_check_mark: | N/A | -| `schema_` | *str* | :heavy_check_mark: | N/A | | `table_name` | *str* | :heavy_check_mark: | N/A | -| `user` | *str* | :heavy_check_mark: | N/A | \ No newline at end of file +| `user` | *str* | :heavy_check_mark: | N/A | +| `schema_` | *Optional[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/docs/models/shared/snowflakesourceconnectorconfiginput.md b/docs/models/shared/snowflakesourceconnectorconfiginput.md index 7f1dd837..fb9e0406 100644 --- a/docs/models/shared/snowflakesourceconnectorconfiginput.md +++ b/docs/models/shared/snowflakesourceconnectorconfiginput.md @@ -11,9 +11,9 @@ | `id_column` | *str* | :heavy_check_mark: | N/A | | `password` | *str* | :heavy_check_mark: | N/A | | `role` | *str* | :heavy_check_mark: | N/A | -| `schema_` | *str* | :heavy_check_mark: | N/A | | `table_name` | *str* | :heavy_check_mark: | N/A | | `user` | *str* | :heavy_check_mark: | N/A | | `batch_size` | *Optional[int]* | :heavy_minus_sign: | N/A | | `fields` | List[*str*] | :heavy_minus_sign: | N/A | -| `port` | *Optional[int]* | :heavy_minus_sign: | N/A | \ No newline at end of file +| `port` | *Optional[int]* | :heavy_minus_sign: | N/A | +| `schema_` | *Optional[str]* | :heavy_minus_sign: | N/A | \ No newline at end of file diff --git a/gen.yaml b/gen.yaml index 9e092c1e..305b4952 100644 --- a/gen.yaml +++ b/gen.yaml @@ -12,7 +12,7 @@ generation: oAuth2ClientCredentialsEnabled: false oAuth2PasswordEnabled: false python: - version: 0.31.6 + version: 0.32.0 additionalDependencies: dev: deepdiff: '>=6.0' diff --git a/pyproject.toml b/pyproject.toml index 1d10631a..fe19dc4f 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [project] name = "unstructured-client" -version = "0.31.6" +version = "0.32.0" description = "Python Client SDK for Unstructured API" authors = [{ name = "Unstructured" },] readme = "README-PYPI.md" diff --git a/src/unstructured_client/_version.py b/src/unstructured_client/_version.py index cf8214b2..a7e13028 100644 --- a/src/unstructured_client/_version.py +++ b/src/unstructured_client/_version.py @@ -3,10 +3,10 @@ import importlib.metadata __title__: str = "unstructured-client" -__version__: str = "0.31.6" -__openapi_doc_version__: str = "1.0.81" -__gen_version__: str = "2.562.2" -__user_agent__: str = "speakeasy-sdk/python 0.31.6 2.562.2 1.0.81 unstructured-client" +__version__: str = "0.32.0" +__openapi_doc_version__: str = "1.1.4" +__gen_version__: str = "2.563.0" +__user_agent__: str = "speakeasy-sdk/python 0.32.0 2.563.0 1.1.4 unstructured-client" try: if __package__ is not None: diff --git a/src/unstructured_client/destinations.py b/src/unstructured_client/destinations.py index 64fd3568..6eba26da 100644 --- a/src/unstructured_client/destinations.py +++ b/src/unstructured_client/destinations.py @@ -86,7 +86,7 @@ def create_destination( hook_ctx=HookContext( base_url=base_url or "", operation_id="create_destination", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -206,7 +206,7 @@ async def create_destination_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="create_destination", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -319,7 +319,7 @@ def delete_destination( hook_ctx=HookContext( base_url=base_url or "", operation_id="delete_destination", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -430,7 +430,7 @@ async def delete_destination_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="delete_destination", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -540,7 +540,7 @@ def get_destination( hook_ctx=HookContext( base_url=base_url or "", operation_id="get_destination", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -652,7 +652,7 @@ async def get_destination_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="get_destination", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -765,7 +765,7 @@ def list_destinations( hook_ctx=HookContext( base_url=base_url or "", operation_id="list_destinations", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -879,7 +879,7 @@ async def list_destinations_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="list_destinations", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -1000,7 +1000,7 @@ def update_destination( hook_ctx=HookContext( base_url=base_url or "", operation_id="update_destination", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -1120,7 +1120,7 @@ async def update_destination_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="update_destination", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, diff --git a/src/unstructured_client/jobs.py b/src/unstructured_client/jobs.py index fdd8c1b7..50eef1b4 100644 --- a/src/unstructured_client/jobs.py +++ b/src/unstructured_client/jobs.py @@ -78,7 +78,7 @@ def cancel_job( hook_ctx=HookContext( base_url=base_url or "", operation_id="cancel_job", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -188,7 +188,7 @@ async def cancel_job_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="cancel_job", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -299,7 +299,7 @@ def download_job_output( hook_ctx=HookContext( base_url=base_url or "", operation_id="download_job_output", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -410,7 +410,7 @@ async def download_job_output_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="download_job_output", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -518,7 +518,7 @@ def get_job( hook_ctx=HookContext( base_url=base_url or "", operation_id="get_job", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -628,7 +628,7 @@ async def get_job_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="get_job", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -738,7 +738,7 @@ def list_jobs( hook_ctx=HookContext( base_url=base_url or "", operation_id="list_jobs", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -848,7 +848,7 @@ async def list_jobs_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="list_jobs", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, diff --git a/src/unstructured_client/models/shared/astradbconnectorconfiginput.py b/src/unstructured_client/models/shared/astradbconnectorconfiginput.py index cb1c8dec..39eee29d 100644 --- a/src/unstructured_client/models/shared/astradbconnectorconfiginput.py +++ b/src/unstructured_client/models/shared/astradbconnectorconfiginput.py @@ -18,6 +18,7 @@ class AstraDBConnectorConfigInputTypedDict(TypedDict): collection_name: str token: str batch_size: NotRequired[int] + flatten_metadata: NotRequired[bool] keyspace: NotRequired[Nullable[str]] @@ -30,11 +31,13 @@ class AstraDBConnectorConfigInput(BaseModel): batch_size: Optional[int] = 20 + flatten_metadata: Optional[bool] = False + keyspace: OptionalNullable[str] = UNSET @model_serializer(mode="wrap") def serialize_model(self, handler): - optional_fields = ["batch_size", "keyspace"] + optional_fields = ["batch_size", "flatten_metadata", "keyspace"] nullable_fields = ["keyspace"] null_default_fields = [] diff --git a/src/unstructured_client/models/shared/confluencesourceconnectorconfig.py b/src/unstructured_client/models/shared/confluencesourceconnectorconfig.py index 1fe9023a..02cf4597 100644 --- a/src/unstructured_client/models/shared/confluencesourceconnectorconfig.py +++ b/src/unstructured_client/models/shared/confluencesourceconnectorconfig.py @@ -2,6 +2,7 @@ from __future__ import annotations from pydantic import model_serializer +from typing import List, Optional from typing_extensions import NotRequired, TypedDict from unstructured_client.types import ( BaseModel, @@ -16,9 +17,11 @@ class ConfluenceSourceConnectorConfigTypedDict(TypedDict): cloud: bool max_num_of_docs_from_each_space: int max_num_of_spaces: int - spaces: Nullable[str] + spaces: Nullable[List[str]] url: str username: str + extract_files: NotRequired[bool] + extract_images: NotRequired[bool] password: NotRequired[Nullable[str]] token: NotRequired[Nullable[str]] @@ -30,19 +33,23 @@ class ConfluenceSourceConnectorConfig(BaseModel): max_num_of_spaces: int - spaces: Nullable[str] + spaces: Nullable[List[str]] url: str username: str + extract_files: Optional[bool] = False + + extract_images: Optional[bool] = False + password: OptionalNullable[str] = UNSET token: OptionalNullable[str] = UNSET @model_serializer(mode="wrap") def serialize_model(self, handler): - optional_fields = ["password", "token"] + optional_fields = ["extract_files", "extract_images", "password", "token"] nullable_fields = ["spaces", "password", "token"] null_default_fields = [] diff --git a/src/unstructured_client/models/shared/confluencesourceconnectorconfiginput.py b/src/unstructured_client/models/shared/confluencesourceconnectorconfiginput.py index 7f4cb4ee..2afec1d1 100644 --- a/src/unstructured_client/models/shared/confluencesourceconnectorconfiginput.py +++ b/src/unstructured_client/models/shared/confluencesourceconnectorconfiginput.py @@ -2,7 +2,7 @@ from __future__ import annotations from pydantic import model_serializer -from typing import Optional +from typing import List, Optional from typing_extensions import NotRequired, TypedDict from unstructured_client.types import ( BaseModel, @@ -17,10 +17,12 @@ class ConfluenceSourceConnectorConfigInputTypedDict(TypedDict): url: str username: str cloud: NotRequired[bool] + extract_files: NotRequired[bool] + extract_images: NotRequired[bool] max_num_of_docs_from_each_space: NotRequired[int] max_num_of_spaces: NotRequired[int] password: NotRequired[Nullable[str]] - spaces: NotRequired[Nullable[str]] + spaces: NotRequired[Nullable[List[str]]] token: NotRequired[Nullable[str]] @@ -31,13 +33,17 @@ class ConfluenceSourceConnectorConfigInput(BaseModel): cloud: Optional[bool] = False + extract_files: Optional[bool] = False + + extract_images: Optional[bool] = False + max_num_of_docs_from_each_space: Optional[int] = 150 max_num_of_spaces: Optional[int] = 500 password: OptionalNullable[str] = UNSET - spaces: OptionalNullable[str] = UNSET + spaces: OptionalNullable[List[str]] = UNSET token: OptionalNullable[str] = UNSET @@ -45,6 +51,8 @@ class ConfluenceSourceConnectorConfigInput(BaseModel): def serialize_model(self, handler): optional_fields = [ "cloud", + "extract_files", + "extract_images", "max_num_of_docs_from_each_space", "max_num_of_spaces", "password", diff --git a/src/unstructured_client/models/shared/createdestinationconnector.py b/src/unstructured_client/models/shared/createdestinationconnector.py index 79525294..a6699c29 100644 --- a/src/unstructured_client/models/shared/createdestinationconnector.py +++ b/src/unstructured_client/models/shared/createdestinationconnector.py @@ -98,10 +98,10 @@ DeltaTableConnectorConfigInputTypedDict, QdrantCloudDestinationConnectorConfigInputTypedDict, PineconeDestinationConnectorConfigInputTypedDict, - AstraDBConnectorConfigInputTypedDict, Neo4jDestinationConnectorConfigInputTypedDict, OneDriveDestinationConnectorConfigInputTypedDict, S3DestinationConnectorConfigInputTypedDict, + AstraDBConnectorConfigInputTypedDict, MilvusDestinationConnectorConfigInputTypedDict, DatabricksVolumesConnectorConfigInputTypedDict, PostgresDestinationConnectorConfigInputTypedDict, @@ -125,10 +125,10 @@ DeltaTableConnectorConfigInput, QdrantCloudDestinationConnectorConfigInput, PineconeDestinationConnectorConfigInput, - AstraDBConnectorConfigInput, Neo4jDestinationConnectorConfigInput, OneDriveDestinationConnectorConfigInput, S3DestinationConnectorConfigInput, + AstraDBConnectorConfigInput, MilvusDestinationConnectorConfigInput, DatabricksVolumesConnectorConfigInput, PostgresDestinationConnectorConfigInput, diff --git a/src/unstructured_client/models/shared/createsourceconnector.py b/src/unstructured_client/models/shared/createsourceconnector.py index bd296e1e..46f62862 100644 --- a/src/unstructured_client/models/shared/createsourceconnector.py +++ b/src/unstructured_client/models/shared/createsourceconnector.py @@ -95,20 +95,20 @@ GCSSourceConnectorConfigInputTypedDict, ElasticsearchConnectorConfigInputTypedDict, DropboxSourceConnectorConfigInputTypedDict, - SalesforceSourceConnectorConfigInputTypedDict, GoogleDriveSourceConnectorConfigInputTypedDict, + SalesforceSourceConnectorConfigInputTypedDict, ZendeskSourceConnectorConfigInputTypedDict, - SharePointSourceConnectorConfigInputTypedDict, AzureSourceConnectorConfigInputTypedDict, S3SourceConnectorConfigInputTypedDict, DatabricksVolumesConnectorConfigInputTypedDict, + KafkaCloudSourceConnectorConfigInputTypedDict, OneDriveSourceConnectorConfigInputTypedDict, OutlookSourceConnectorConfigInputTypedDict, - KafkaCloudSourceConnectorConfigInputTypedDict, - ConfluenceSourceConnectorConfigInputTypedDict, + SharePointSourceConnectorConfigInputTypedDict, JiraSourceConnectorConfigInputTypedDict, CouchbaseSourceConnectorConfigInputTypedDict, PostgresSourceConnectorConfigInputTypedDict, + ConfluenceSourceConnectorConfigInputTypedDict, SnowflakeSourceConnectorConfigInputTypedDict, ], ) @@ -122,20 +122,20 @@ GCSSourceConnectorConfigInput, ElasticsearchConnectorConfigInput, DropboxSourceConnectorConfigInput, - SalesforceSourceConnectorConfigInput, GoogleDriveSourceConnectorConfigInput, + SalesforceSourceConnectorConfigInput, ZendeskSourceConnectorConfigInput, - SharePointSourceConnectorConfigInput, AzureSourceConnectorConfigInput, S3SourceConnectorConfigInput, DatabricksVolumesConnectorConfigInput, + KafkaCloudSourceConnectorConfigInput, OneDriveSourceConnectorConfigInput, OutlookSourceConnectorConfigInput, - KafkaCloudSourceConnectorConfigInput, - ConfluenceSourceConnectorConfigInput, + SharePointSourceConnectorConfigInput, JiraSourceConnectorConfigInput, CouchbaseSourceConnectorConfigInput, PostgresSourceConnectorConfigInput, + ConfluenceSourceConnectorConfigInput, SnowflakeSourceConnectorConfigInput, ], ) diff --git a/src/unstructured_client/models/shared/jirasourceconnectorconfig.py b/src/unstructured_client/models/shared/jirasourceconnectorconfig.py index b0d710b6..e5486770 100644 --- a/src/unstructured_client/models/shared/jirasourceconnectorconfig.py +++ b/src/unstructured_client/models/shared/jirasourceconnectorconfig.py @@ -2,6 +2,7 @@ from __future__ import annotations from pydantic import model_serializer +from typing import List from typing_extensions import NotRequired, TypedDict from unstructured_client.types import ( BaseModel, @@ -15,11 +16,11 @@ class JiraSourceConnectorConfigTypedDict(TypedDict): url: str username: str - boards: NotRequired[Nullable[str]] + boards: NotRequired[Nullable[List[str]]] cloud: NotRequired[Nullable[bool]] - issues: NotRequired[Nullable[str]] + issues: NotRequired[Nullable[List[str]]] password: NotRequired[Nullable[str]] - projects: NotRequired[Nullable[str]] + projects: NotRequired[Nullable[List[str]]] token: NotRequired[Nullable[str]] @@ -28,15 +29,15 @@ class JiraSourceConnectorConfig(BaseModel): username: str - boards: OptionalNullable[str] = UNSET + boards: OptionalNullable[List[str]] = UNSET cloud: OptionalNullable[bool] = UNSET - issues: OptionalNullable[str] = UNSET + issues: OptionalNullable[List[str]] = UNSET password: OptionalNullable[str] = UNSET - projects: OptionalNullable[str] = UNSET + projects: OptionalNullable[List[str]] = UNSET token: OptionalNullable[str] = UNSET diff --git a/src/unstructured_client/models/shared/jirasourceconnectorconfiginput.py b/src/unstructured_client/models/shared/jirasourceconnectorconfiginput.py index f73ab739..624def94 100644 --- a/src/unstructured_client/models/shared/jirasourceconnectorconfiginput.py +++ b/src/unstructured_client/models/shared/jirasourceconnectorconfiginput.py @@ -2,6 +2,7 @@ from __future__ import annotations from pydantic import model_serializer +from typing import List from typing_extensions import NotRequired, TypedDict from unstructured_client.types import ( BaseModel, @@ -15,11 +16,11 @@ class JiraSourceConnectorConfigInputTypedDict(TypedDict): url: str username: str - boards: NotRequired[Nullable[str]] + boards: NotRequired[Nullable[List[str]]] cloud: NotRequired[Nullable[bool]] - issues: NotRequired[Nullable[str]] + issues: NotRequired[Nullable[List[str]]] password: NotRequired[Nullable[str]] - projects: NotRequired[Nullable[str]] + projects: NotRequired[Nullable[List[str]]] token: NotRequired[Nullable[str]] @@ -28,15 +29,15 @@ class JiraSourceConnectorConfigInput(BaseModel): username: str - boards: OptionalNullable[str] = UNSET + boards: OptionalNullable[List[str]] = UNSET cloud: OptionalNullable[bool] = UNSET - issues: OptionalNullable[str] = UNSET + issues: OptionalNullable[List[str]] = UNSET password: OptionalNullable[str] = UNSET - projects: OptionalNullable[str] = UNSET + projects: OptionalNullable[List[str]] = UNSET token: OptionalNullable[str] = UNSET diff --git a/src/unstructured_client/models/shared/partition_parameters.py b/src/unstructured_client/models/shared/partition_parameters.py index 43cc698f..f494c68d 100644 --- a/src/unstructured_client/models/shared/partition_parameters.py +++ b/src/unstructured_client/models/shared/partition_parameters.py @@ -144,6 +144,14 @@ class PartitionParametersTypedDict(TypedDict): r"""When `True`, apply overlap between 'normal' chunks formed from whole elements and not subject to text-splitting. Use this with caution as it entails a certain level of 'pollution' of otherwise clean semantic chunk boundaries. Default: False""" pdf_infer_table_structure: NotRequired[bool] r"""Deprecated! Use skip_infer_table_types to opt out of table extraction for any file type. If False and strategy=hi_res, no Table Elements will be extracted from pdf files regardless of skip_infer_table_types contents.""" + pdfminer_char_margin: NotRequired[Nullable[float]] + r"""If two characters are closer together than this margin they are considered part of the same line. The margin is specified relative to the width of the character.""" + pdfminer_line_margin: NotRequired[Nullable[float]] + r"""If two lines are close together they are considered to be part of the same paragraph. The margin is specified relative to the height of a line.""" + pdfminer_line_overlap: NotRequired[Nullable[float]] + r"""If two characters have more overlap than this they are considered to be on the same line. The overlap is specified relative to the minimum height of both characters.""" + pdfminer_word_margin: NotRequired[Nullable[float]] + r"""If two characters on the same line are further apart than this margin then they are considered to be two separate words, and an intermediate space will be added for readability. The margin is specified relative to the width of the character.""" similarity_threshold: NotRequired[Nullable[float]] r"""A value between 0.0 and 1.0 describing the minimum similarity two elements must have to be included in the same chunk. Note that similar elements may be separated to meet chunk-size criteria; this value can only guarantees that two elements with similarity below the threshold will appear in separate chunks.""" skip_infer_table_types: NotRequired[List[str]] @@ -263,6 +271,26 @@ class PartitionParameters(BaseModel): ] = True r"""Deprecated! Use skip_infer_table_types to opt out of table extraction for any file type. If False and strategy=hi_res, no Table Elements will be extracted from pdf files regardless of skip_infer_table_types contents.""" + pdfminer_char_margin: Annotated[ + OptionalNullable[float], FieldMetadata(multipart=True) + ] = None + r"""If two characters are closer together than this margin they are considered part of the same line. The margin is specified relative to the width of the character.""" + + pdfminer_line_margin: Annotated[ + OptionalNullable[float], FieldMetadata(multipart=True) + ] = None + r"""If two lines are close together they are considered to be part of the same paragraph. The margin is specified relative to the height of a line.""" + + pdfminer_line_overlap: Annotated[ + OptionalNullable[float], FieldMetadata(multipart=True) + ] = None + r"""If two characters have more overlap than this they are considered to be on the same line. The overlap is specified relative to the minimum height of both characters.""" + + pdfminer_word_margin: Annotated[ + OptionalNullable[float], FieldMetadata(multipart=True) + ] = None + r"""If two characters on the same line are further apart than this margin then they are considered to be two separate words, and an intermediate space will be added for readability. The margin is specified relative to the width of the character.""" + similarity_threshold: Annotated[ OptionalNullable[float], FieldMetadata(multipart=True) ] = None @@ -360,6 +388,10 @@ def serialize_model(self, handler): "overlap", "overlap_all", "pdf_infer_table_structure", + "pdfminer_char_margin", + "pdfminer_line_margin", + "pdfminer_line_overlap", + "pdfminer_word_margin", "similarity_threshold", "skip_infer_table_types", "split_pdf_allow_failed", @@ -386,6 +418,10 @@ def serialize_model(self, handler): "include_orig_elements", "max_characters", "new_after_n_chars", + "pdfminer_char_margin", + "pdfminer_line_margin", + "pdfminer_line_overlap", + "pdfminer_word_margin", "similarity_threshold", "starting_page_number", "table_ocr_agent", @@ -400,6 +436,10 @@ def serialize_model(self, handler): "include_orig_elements", "max_characters", "new_after_n_chars", + "pdfminer_char_margin", + "pdfminer_line_margin", + "pdfminer_line_overlap", + "pdfminer_word_margin", "similarity_threshold", "starting_page_number", "table_ocr_agent", diff --git a/src/unstructured_client/models/shared/sharepointsourceconnectorconfig.py b/src/unstructured_client/models/shared/sharepointsourceconnectorconfig.py index 742e7ba5..1ec70918 100644 --- a/src/unstructured_client/models/shared/sharepointsourceconnectorconfig.py +++ b/src/unstructured_client/models/shared/sharepointsourceconnectorconfig.py @@ -2,6 +2,7 @@ from __future__ import annotations from pydantic import model_serializer +from typing import Optional from typing_extensions import NotRequired, TypedDict from unstructured_client.types import ( BaseModel, @@ -17,6 +18,9 @@ class SharePointSourceConnectorConfigTypedDict(TypedDict): client_id: str recursive: bool site: str + tenant: str + user_pname: str + authority_url: NotRequired[str] path: NotRequired[Nullable[str]] @@ -29,11 +33,17 @@ class SharePointSourceConnectorConfig(BaseModel): site: str + tenant: str + + user_pname: str + + authority_url: Optional[str] = "https://login.microsoftonline.com" + path: OptionalNullable[str] = UNSET @model_serializer(mode="wrap") def serialize_model(self, handler): - optional_fields = ["path"] + optional_fields = ["authority_url", "path"] nullable_fields = ["path"] null_default_fields = [] diff --git a/src/unstructured_client/models/shared/sharepointsourceconnectorconfiginput.py b/src/unstructured_client/models/shared/sharepointsourceconnectorconfiginput.py index 2f1ebff6..c9ce9003 100644 --- a/src/unstructured_client/models/shared/sharepointsourceconnectorconfiginput.py +++ b/src/unstructured_client/models/shared/sharepointsourceconnectorconfiginput.py @@ -17,6 +17,9 @@ class SharePointSourceConnectorConfigInputTypedDict(TypedDict): client_cred: str client_id: str site: str + tenant: str + user_pname: str + authority_url: NotRequired[str] path: NotRequired[Nullable[str]] recursive: NotRequired[bool] @@ -28,13 +31,19 @@ class SharePointSourceConnectorConfigInput(BaseModel): site: str + tenant: str + + user_pname: str + + authority_url: Optional[str] = "https://login.microsoftonline.com" + path: OptionalNullable[str] = UNSET recursive: Optional[bool] = False @model_serializer(mode="wrap") def serialize_model(self, handler): - optional_fields = ["path", "recursive"] + optional_fields = ["authority_url", "path", "recursive"] nullable_fields = ["path"] null_default_fields = [] diff --git a/src/unstructured_client/models/shared/snowflakedestinationconnectorconfig.py b/src/unstructured_client/models/shared/snowflakedestinationconnectorconfig.py index 644566f1..0ea4aa0e 100644 --- a/src/unstructured_client/models/shared/snowflakedestinationconnectorconfig.py +++ b/src/unstructured_client/models/shared/snowflakedestinationconnectorconfig.py @@ -2,7 +2,8 @@ from __future__ import annotations import pydantic -from typing_extensions import Annotated, TypedDict +from typing import Optional +from typing_extensions import Annotated, NotRequired, TypedDict from unstructured_client.types import BaseModel @@ -15,9 +16,9 @@ class SnowflakeDestinationConnectorConfigTypedDict(TypedDict): port: int record_id_key: str role: str - schema_: str table_name: str user: str + schema_: NotRequired[str] class SnowflakeDestinationConnectorConfig(BaseModel): @@ -37,8 +38,8 @@ class SnowflakeDestinationConnectorConfig(BaseModel): role: str - schema_: Annotated[str, pydantic.Field(alias="schema")] - table_name: str user: str + + schema_: Annotated[Optional[str], pydantic.Field(alias="schema")] = None diff --git a/src/unstructured_client/models/shared/snowflakedestinationconnectorconfiginput.py b/src/unstructured_client/models/shared/snowflakedestinationconnectorconfiginput.py index 9f8561c3..ff95a0a4 100644 --- a/src/unstructured_client/models/shared/snowflakedestinationconnectorconfiginput.py +++ b/src/unstructured_client/models/shared/snowflakedestinationconnectorconfiginput.py @@ -22,12 +22,12 @@ class SnowflakeDestinationConnectorConfigInputTypedDict(TypedDict): id_column: str password: str role: str - schema_: str table_name: str user: str batch_size: NotRequired[int] port: NotRequired[int] record_id_key: NotRequired[Nullable[str]] + schema_: NotRequired[str] class SnowflakeDestinationConnectorConfigInput(BaseModel): @@ -45,8 +45,6 @@ class SnowflakeDestinationConnectorConfigInput(BaseModel): role: str - schema_: Annotated[str, pydantic.Field(alias="schema")] - table_name: str user: str @@ -57,9 +55,11 @@ class SnowflakeDestinationConnectorConfigInput(BaseModel): record_id_key: OptionalNullable[str] = UNSET + schema_: Annotated[Optional[str], pydantic.Field(alias="schema")] = None + @model_serializer(mode="wrap") def serialize_model(self, handler): - optional_fields = ["batch_size", "port", "record_id_key"] + optional_fields = ["batch_size", "port", "record_id_key", "schema"] nullable_fields = ["record_id_key"] null_default_fields = [] diff --git a/src/unstructured_client/models/shared/snowflakesourceconnectorconfig.py b/src/unstructured_client/models/shared/snowflakesourceconnectorconfig.py index b61f13c9..44cf176c 100644 --- a/src/unstructured_client/models/shared/snowflakesourceconnectorconfig.py +++ b/src/unstructured_client/models/shared/snowflakesourceconnectorconfig.py @@ -2,8 +2,8 @@ from __future__ import annotations import pydantic -from typing import List -from typing_extensions import Annotated, TypedDict +from typing import List, Optional +from typing_extensions import Annotated, NotRequired, TypedDict from unstructured_client.types import BaseModel @@ -17,9 +17,9 @@ class SnowflakeSourceConnectorConfigTypedDict(TypedDict): password: str port: int role: str - schema_: str table_name: str user: str + schema_: NotRequired[str] class SnowflakeSourceConnectorConfig(BaseModel): @@ -41,8 +41,8 @@ class SnowflakeSourceConnectorConfig(BaseModel): role: str - schema_: Annotated[str, pydantic.Field(alias="schema")] - table_name: str user: str + + schema_: Annotated[Optional[str], pydantic.Field(alias="schema")] = None diff --git a/src/unstructured_client/models/shared/snowflakesourceconnectorconfiginput.py b/src/unstructured_client/models/shared/snowflakesourceconnectorconfiginput.py index 81959991..7b7c1e97 100644 --- a/src/unstructured_client/models/shared/snowflakesourceconnectorconfiginput.py +++ b/src/unstructured_client/models/shared/snowflakesourceconnectorconfiginput.py @@ -21,12 +21,12 @@ class SnowflakeSourceConnectorConfigInputTypedDict(TypedDict): id_column: str password: str role: str - schema_: str table_name: str user: str batch_size: NotRequired[int] fields: NotRequired[Nullable[List[str]]] port: NotRequired[int] + schema_: NotRequired[str] class SnowflakeSourceConnectorConfigInput(BaseModel): @@ -42,8 +42,6 @@ class SnowflakeSourceConnectorConfigInput(BaseModel): role: str - schema_: Annotated[str, pydantic.Field(alias="schema")] - table_name: str user: str @@ -54,9 +52,11 @@ class SnowflakeSourceConnectorConfigInput(BaseModel): port: Optional[int] = 443 + schema_: Annotated[Optional[str], pydantic.Field(alias="schema")] = None + @model_serializer(mode="wrap") def serialize_model(self, handler): - optional_fields = ["batch_size", "fields", "port"] + optional_fields = ["batch_size", "fields", "port", "schema"] nullable_fields = ["fields"] null_default_fields = [] diff --git a/src/unstructured_client/models/shared/sourceconnectorinformation.py b/src/unstructured_client/models/shared/sourceconnectorinformation.py index 998a3cd9..427cff25 100644 --- a/src/unstructured_client/models/shared/sourceconnectorinformation.py +++ b/src/unstructured_client/models/shared/sourceconnectorinformation.py @@ -106,17 +106,17 @@ SalesforceSourceConnectorConfigTypedDict, GoogleDriveSourceConnectorConfigTypedDict, ZendeskSourceConnectorConfigTypedDict, - SharePointSourceConnectorConfigTypedDict, AzureSourceConnectorConfigTypedDict, OneDriveSourceConnectorConfigTypedDict, + KafkaCloudSourceConnectorConfigTypedDict, DatabricksVolumesConnectorConfigTypedDict, OutlookSourceConnectorConfigTypedDict, S3SourceConnectorConfigTypedDict, - KafkaCloudSourceConnectorConfigTypedDict, - ConfluenceSourceConnectorConfigTypedDict, + SharePointSourceConnectorConfigTypedDict, JiraSourceConnectorConfigTypedDict, CouchbaseSourceConnectorConfigTypedDict, PostgresSourceConnectorConfigTypedDict, + ConfluenceSourceConnectorConfigTypedDict, SnowflakeSourceConnectorConfigTypedDict, ], ) @@ -133,17 +133,17 @@ SalesforceSourceConnectorConfig, GoogleDriveSourceConnectorConfig, ZendeskSourceConnectorConfig, - SharePointSourceConnectorConfig, AzureSourceConnectorConfig, OneDriveSourceConnectorConfig, + KafkaCloudSourceConnectorConfig, DatabricksVolumesConnectorConfig, OutlookSourceConnectorConfig, S3SourceConnectorConfig, - KafkaCloudSourceConnectorConfig, - ConfluenceSourceConnectorConfig, + SharePointSourceConnectorConfig, JiraSourceConnectorConfig, CouchbaseSourceConnectorConfig, PostgresSourceConnectorConfig, + ConfluenceSourceConnectorConfig, SnowflakeSourceConnectorConfig, ], ) diff --git a/src/unstructured_client/models/shared/updatedestinationconnector.py b/src/unstructured_client/models/shared/updatedestinationconnector.py index 7abac038..c0499187 100644 --- a/src/unstructured_client/models/shared/updatedestinationconnector.py +++ b/src/unstructured_client/models/shared/updatedestinationconnector.py @@ -97,10 +97,10 @@ DeltaTableConnectorConfigInputTypedDict, QdrantCloudDestinationConnectorConfigInputTypedDict, PineconeDestinationConnectorConfigInputTypedDict, - AstraDBConnectorConfigInputTypedDict, Neo4jDestinationConnectorConfigInputTypedDict, OneDriveDestinationConnectorConfigInputTypedDict, S3DestinationConnectorConfigInputTypedDict, + AstraDBConnectorConfigInputTypedDict, MilvusDestinationConnectorConfigInputTypedDict, DatabricksVolumesConnectorConfigInputTypedDict, PostgresDestinationConnectorConfigInputTypedDict, @@ -124,10 +124,10 @@ DeltaTableConnectorConfigInput, QdrantCloudDestinationConnectorConfigInput, PineconeDestinationConnectorConfigInput, - AstraDBConnectorConfigInput, Neo4jDestinationConnectorConfigInput, OneDriveDestinationConnectorConfigInput, S3DestinationConnectorConfigInput, + AstraDBConnectorConfigInput, MilvusDestinationConnectorConfigInput, DatabricksVolumesConnectorConfigInput, PostgresDestinationConnectorConfigInput, diff --git a/src/unstructured_client/models/shared/updatesourceconnector.py b/src/unstructured_client/models/shared/updatesourceconnector.py index bae5ee7a..54c19445 100644 --- a/src/unstructured_client/models/shared/updatesourceconnector.py +++ b/src/unstructured_client/models/shared/updatesourceconnector.py @@ -94,20 +94,20 @@ GCSSourceConnectorConfigInputTypedDict, ElasticsearchConnectorConfigInputTypedDict, DropboxSourceConnectorConfigInputTypedDict, - SalesforceSourceConnectorConfigInputTypedDict, GoogleDriveSourceConnectorConfigInputTypedDict, + SalesforceSourceConnectorConfigInputTypedDict, ZendeskSourceConnectorConfigInputTypedDict, - SharePointSourceConnectorConfigInputTypedDict, AzureSourceConnectorConfigInputTypedDict, S3SourceConnectorConfigInputTypedDict, DatabricksVolumesConnectorConfigInputTypedDict, + KafkaCloudSourceConnectorConfigInputTypedDict, OneDriveSourceConnectorConfigInputTypedDict, OutlookSourceConnectorConfigInputTypedDict, - KafkaCloudSourceConnectorConfigInputTypedDict, - ConfluenceSourceConnectorConfigInputTypedDict, + SharePointSourceConnectorConfigInputTypedDict, JiraSourceConnectorConfigInputTypedDict, CouchbaseSourceConnectorConfigInputTypedDict, PostgresSourceConnectorConfigInputTypedDict, + ConfluenceSourceConnectorConfigInputTypedDict, SnowflakeSourceConnectorConfigInputTypedDict, ], ) @@ -121,20 +121,20 @@ GCSSourceConnectorConfigInput, ElasticsearchConnectorConfigInput, DropboxSourceConnectorConfigInput, - SalesforceSourceConnectorConfigInput, GoogleDriveSourceConnectorConfigInput, + SalesforceSourceConnectorConfigInput, ZendeskSourceConnectorConfigInput, - SharePointSourceConnectorConfigInput, AzureSourceConnectorConfigInput, S3SourceConnectorConfigInput, DatabricksVolumesConnectorConfigInput, + KafkaCloudSourceConnectorConfigInput, OneDriveSourceConnectorConfigInput, OutlookSourceConnectorConfigInput, - KafkaCloudSourceConnectorConfigInput, - ConfluenceSourceConnectorConfigInput, + SharePointSourceConnectorConfigInput, JiraSourceConnectorConfigInput, CouchbaseSourceConnectorConfigInput, PostgresSourceConnectorConfigInput, + ConfluenceSourceConnectorConfigInput, SnowflakeSourceConnectorConfigInput, ], ) diff --git a/src/unstructured_client/sources.py b/src/unstructured_client/sources.py index cfc75508..20d0d09d 100644 --- a/src/unstructured_client/sources.py +++ b/src/unstructured_client/sources.py @@ -85,7 +85,7 @@ def create_source( hook_ctx=HookContext( base_url=base_url or "", operation_id="create_source", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -204,7 +204,7 @@ async def create_source_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="create_source", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -316,7 +316,7 @@ def delete_source( hook_ctx=HookContext( base_url=base_url or "", operation_id="delete_source", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -426,7 +426,7 @@ async def delete_source_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="delete_source", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -536,7 +536,7 @@ def get_source( hook_ctx=HookContext( base_url=base_url or "", operation_id="get_source", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -648,7 +648,7 @@ async def get_source_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="get_source", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -760,7 +760,7 @@ def list_sources( hook_ctx=HookContext( base_url=base_url or "", operation_id="list_sources", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -872,7 +872,7 @@ async def list_sources_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="list_sources", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -991,7 +991,7 @@ def update_source( hook_ctx=HookContext( base_url=base_url or "", operation_id="update_source", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -1110,7 +1110,7 @@ async def update_source_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="update_source", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, diff --git a/src/unstructured_client/workflows.py b/src/unstructured_client/workflows.py index 4fa96b14..18822198 100644 --- a/src/unstructured_client/workflows.py +++ b/src/unstructured_client/workflows.py @@ -81,7 +81,7 @@ def create_workflow( hook_ctx=HookContext( base_url=base_url or "", operation_id="create_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -196,7 +196,7 @@ async def create_workflow_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="create_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -308,7 +308,7 @@ def delete_workflow( hook_ctx=HookContext( base_url=base_url or "", operation_id="delete_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -418,7 +418,7 @@ async def delete_workflow_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="delete_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -528,7 +528,7 @@ def get_workflow( hook_ctx=HookContext( base_url=base_url or "", operation_id="get_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -640,7 +640,7 @@ async def get_workflow_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="get_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -752,7 +752,7 @@ def list_workflows( hook_ctx=HookContext( base_url=base_url or "", operation_id="list_workflows", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -864,7 +864,7 @@ async def list_workflows_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="list_workflows", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -983,7 +983,7 @@ def run_workflow( hook_ctx=HookContext( base_url=base_url or "", operation_id="run_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -1102,7 +1102,7 @@ async def run_workflow_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="run_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -1217,7 +1217,7 @@ def update_workflow( hook_ctx=HookContext( base_url=base_url or "", operation_id="update_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req, @@ -1332,7 +1332,7 @@ async def update_workflow_async( hook_ctx=HookContext( base_url=base_url or "", operation_id="update_workflow", - oauth2_scopes=None, + oauth2_scopes=[], security_source=self.sdk_configuration.security, ), request=req,