diff --git a/src/databricks/labs/ucx/source_code/known.json b/src/databricks/labs/ucx/source_code/known.json index 9f5de10ee9..52a792f8ec 100644 --- a/src/databricks/labs/ucx/source_code/known.json +++ b/src/databricks/labs/ucx/source_code/known.json @@ -19661,6 +19661,563 @@ "unidecode": { "unidecode": [] }, + "unstructured": { + "test_unstructured": [], + "test_unstructured.chunking": [], + "test_unstructured.chunking.test_base": [], + "test_unstructured.chunking.test_basic": [], + "test_unstructured.chunking.test_dispatch": [], + "test_unstructured.chunking.test_title": [], + "test_unstructured.cleaners": [], + "test_unstructured.cleaners.test_core": [], + "test_unstructured.cleaners.test_extract": [], + "test_unstructured.cleaners.test_translate": [], + "test_unstructured.documents": [], + "test_unstructured.documents.test_coordinates": [], + "test_unstructured.documents.test_elements": [], + "test_unstructured.documents.test_email_elements": [], + "test_unstructured.documents.test_html": [], + "test_unstructured.embed": [], + "test_unstructured.embed.test_octoai": [], + "test_unstructured.embed.test_openai": [], + "test_unstructured.embed.test_vertexai": [], + "test_unstructured.embed.test_voyageai": [], + "test_unstructured.file_utils": [], + "test_unstructured.file_utils.test_exploration": [], + "test_unstructured.file_utils.test_file_conversion": [], + "test_unstructured.file_utils.test_filetype": [], + "test_unstructured.file_utils.test_metadata": [], + "test_unstructured.metrics": [], + "test_unstructured.metrics.test_element_type": [], + "test_unstructured.metrics.test_evaluate": [], + "test_unstructured.metrics.test_table_formats": [], + "test_unstructured.metrics.test_table_structure": [], + "test_unstructured.metrics.test_text_extraction": [], + "test_unstructured.metrics.test_utils": [], + "test_unstructured.nlp": [], + "test_unstructured.nlp.mock_nltk": [], + "test_unstructured.nlp.test_partition": [], + "test_unstructured.nlp.test_tokenize": [], + "test_unstructured.partition": [], + "test_unstructured.partition.html": [], + "test_unstructured.partition.html.test_parser": [], + "test_unstructured.partition.html.test_partition": [], + "test_unstructured.partition.pdf_image": [], + "test_unstructured.partition.pdf_image.conftest": [], + "test_unstructured.partition.pdf_image.test_chipper": [], + "test_unstructured.partition.pdf_image.test_image": [], + "test_unstructured.partition.pdf_image.test_inference_utils": [], + "test_unstructured.partition.pdf_image.test_ocr": [], + "test_unstructured.partition.pdf_image.test_pdf": [], + "test_unstructured.partition.pdf_image.test_pdf_image_utils": [], + "test_unstructured.partition.pdf_image.test_pdfminer_processing": [], + "test_unstructured.partition.test_api": [], + "test_unstructured.partition.test_auto": [], + "test_unstructured.partition.test_common": [], + "test_unstructured.partition.test_constants": [], + "test_unstructured.partition.test_csv": [], + "test_unstructured.partition.test_doc": [], + "test_unstructured.partition.test_docx": [], + "test_unstructured.partition.test_email": [], + "test_unstructured.partition.test_epub": [], + "test_unstructured.partition.test_json": [], + "test_unstructured.partition.test_lang": [], + "test_unstructured.partition.test_md": [], + "test_unstructured.partition.test_msg": [], + "test_unstructured.partition.test_odt": [], + "test_unstructured.partition.test_org": [], + "test_unstructured.partition.test_ppt": [], + "test_unstructured.partition.test_pptx": [], + "test_unstructured.partition.test_rst": [], + "test_unstructured.partition.test_rtf": [], + "test_unstructured.partition.test_strategies": [], + "test_unstructured.partition.test_text": [], + "test_unstructured.partition.test_text_type": [], + "test_unstructured.partition.test_tsv": [], + "test_unstructured.partition.test_xlsx": [], + "test_unstructured.partition.test_xml_partition": [], + "test_unstructured.partition.utils": [], + "test_unstructured.partition.utils.test_config": [], + "test_unstructured.partition.utils.test_sorting": [], + "test_unstructured.partition.utils.test_xycut": [], + "test_unstructured.staging": [], + "test_unstructured.staging.test_base": [], + "test_unstructured.staging.test_baseplate": [], + "test_unstructured.staging.test_datasaur": [], + "test_unstructured.staging.test_huggingface": [], + "test_unstructured.staging.test_label_box": [], + "test_unstructured.staging.test_label_studio": [], + "test_unstructured.staging.test_prodigy": [], + "test_unstructured.staging.test_weaviate": [], + "test_unstructured.test_utils": [], + "test_unstructured.unit_utils": [], + "unstructured": [], + "unstructured.chunking": [], + "unstructured.chunking.base": [], + "unstructured.chunking.basic": [], + "unstructured.chunking.dispatch": [], + "unstructured.chunking.title": [], + "unstructured.cleaners": [], + "unstructured.cleaners.core": [], + "unstructured.cleaners.extract": [], + "unstructured.cleaners.translate": [], + "unstructured.documents": [], + "unstructured.documents.coordinates": [], + "unstructured.documents.elements": [], + "unstructured.documents.email_elements": [], + "unstructured.documents.html": [], + "unstructured.embed": [], + "unstructured.embed.bedrock": [], + "unstructured.embed.huggingface": [], + "unstructured.embed.interfaces": [], + "unstructured.embed.octoai": [], + "unstructured.embed.openai": [], + "unstructured.embed.vertexai": [], + "unstructured.embed.voyageai": [], + "unstructured.file_utils": [], + "unstructured.file_utils.encoding": [], + "unstructured.file_utils.exploration": [], + "unstructured.file_utils.file_conversion": [], + "unstructured.file_utils.filetype": [], + "unstructured.file_utils.google_filetype": [], + "unstructured.file_utils.metadata": [], + "unstructured.ingest": [], + "unstructured.ingest.cli": [], + "unstructured.ingest.cli.base": [], + "unstructured.ingest.cli.base.cmd": [], + "unstructured.ingest.cli.base.dest": [], + "unstructured.ingest.cli.base.src": [], + "unstructured.ingest.cli.cli": [], + "unstructured.ingest.cli.cmd_factory": [], + "unstructured.ingest.cli.cmds": [], + "unstructured.ingest.cli.cmds.airtable": [], + "unstructured.ingest.cli.cmds.astra": [], + "unstructured.ingest.cli.cmds.azure_cognitive_search": [], + "unstructured.ingest.cli.cmds.biomed": [], + "unstructured.ingest.cli.cmds.chroma": [], + "unstructured.ingest.cli.cmds.clarifai": [], + "unstructured.ingest.cli.cmds.confluence": [], + "unstructured.ingest.cli.cmds.databricks_volumes": [], + "unstructured.ingest.cli.cmds.delta_table": [], + "unstructured.ingest.cli.cmds.discord": [], + "unstructured.ingest.cli.cmds.elasticsearch": [], + "unstructured.ingest.cli.cmds.fsspec": [], + "unstructured.ingest.cli.cmds.fsspec.azure": [], + "unstructured.ingest.cli.cmds.fsspec.box": [], + "unstructured.ingest.cli.cmds.fsspec.dropbox": [], + "unstructured.ingest.cli.cmds.fsspec.fsspec": [], + "unstructured.ingest.cli.cmds.fsspec.gcs": [], + "unstructured.ingest.cli.cmds.fsspec.s3": [], + "unstructured.ingest.cli.cmds.fsspec.sftp": [], + "unstructured.ingest.cli.cmds.github": [], + "unstructured.ingest.cli.cmds.gitlab": [], + "unstructured.ingest.cli.cmds.google_drive": [], + "unstructured.ingest.cli.cmds.hubspot": [], + "unstructured.ingest.cli.cmds.jira": [], + "unstructured.ingest.cli.cmds.kafka": [], + "unstructured.ingest.cli.cmds.local": [], + "unstructured.ingest.cli.cmds.mongodb": [], + "unstructured.ingest.cli.cmds.notion": [], + "unstructured.ingest.cli.cmds.onedrive": [], + "unstructured.ingest.cli.cmds.opensearch": [], + "unstructured.ingest.cli.cmds.outlook": [], + "unstructured.ingest.cli.cmds.pinecone": [], + "unstructured.ingest.cli.cmds.qdrant": [], + "unstructured.ingest.cli.cmds.reddit": [], + "unstructured.ingest.cli.cmds.salesforce": [], + "unstructured.ingest.cli.cmds.sharepoint": [], + "unstructured.ingest.cli.cmds.slack": [], + "unstructured.ingest.cli.cmds.sql": [], + "unstructured.ingest.cli.cmds.vectara": [], + "unstructured.ingest.cli.cmds.weaviate": [], + "unstructured.ingest.cli.cmds.wikipedia": [], + "unstructured.ingest.cli.common": [], + "unstructured.ingest.cli.interfaces": [], + "unstructured.ingest.cli.utils": [], + "unstructured.ingest.connector": [], + "unstructured.ingest.connector.airtable": [], + "unstructured.ingest.connector.astra": [], + "unstructured.ingest.connector.azure_cognitive_search": [], + "unstructured.ingest.connector.biomed": [], + "unstructured.ingest.connector.chroma": [], + "unstructured.ingest.connector.clarifai": [], + "unstructured.ingest.connector.confluence": [], + "unstructured.ingest.connector.databricks_volumes": [], + "unstructured.ingest.connector.delta_table": [], + "unstructured.ingest.connector.discord": [], + "unstructured.ingest.connector.elasticsearch": [], + "unstructured.ingest.connector.fsspec": [], + "unstructured.ingest.connector.fsspec.azure": [], + "unstructured.ingest.connector.fsspec.box": [], + "unstructured.ingest.connector.fsspec.dropbox": [], + "unstructured.ingest.connector.fsspec.fsspec": [], + "unstructured.ingest.connector.fsspec.gcs": [], + "unstructured.ingest.connector.fsspec.s3": [], + "unstructured.ingest.connector.fsspec.sftp": [], + "unstructured.ingest.connector.git": [], + "unstructured.ingest.connector.github": [], + "unstructured.ingest.connector.gitlab": [], + "unstructured.ingest.connector.google_drive": [], + "unstructured.ingest.connector.hubspot": [], + "unstructured.ingest.connector.jira": [], + "unstructured.ingest.connector.kafka": [], + "unstructured.ingest.connector.local": [], + "unstructured.ingest.connector.mongodb": [], + "unstructured.ingest.connector.notion": [], + "unstructured.ingest.connector.notion.client": [], + "unstructured.ingest.connector.notion.connector": [], + "unstructured.ingest.connector.notion.helpers": [], + "unstructured.ingest.connector.notion.interfaces": [], + "unstructured.ingest.connector.notion.types": [], + "unstructured.ingest.connector.notion.types.block": [], + "unstructured.ingest.connector.notion.types.blocks": [], + "unstructured.ingest.connector.notion.types.blocks.bookmark": [], + "unstructured.ingest.connector.notion.types.blocks.breadcrumb": [], + "unstructured.ingest.connector.notion.types.blocks.bulleted_list_item": [], + "unstructured.ingest.connector.notion.types.blocks.callout": [], + "unstructured.ingest.connector.notion.types.blocks.child_database": [], + "unstructured.ingest.connector.notion.types.blocks.child_page": [], + "unstructured.ingest.connector.notion.types.blocks.code": [], + "unstructured.ingest.connector.notion.types.blocks.column_list": [], + "unstructured.ingest.connector.notion.types.blocks.divider": [], + "unstructured.ingest.connector.notion.types.blocks.embed": [], + "unstructured.ingest.connector.notion.types.blocks.equation": [], + "unstructured.ingest.connector.notion.types.blocks.file": [], + "unstructured.ingest.connector.notion.types.blocks.heading": [], + "unstructured.ingest.connector.notion.types.blocks.image": [], + "unstructured.ingest.connector.notion.types.blocks.link_preview": [], + "unstructured.ingest.connector.notion.types.blocks.link_to_page": [], + "unstructured.ingest.connector.notion.types.blocks.numbered_list": [], + "unstructured.ingest.connector.notion.types.blocks.paragraph": [], + "unstructured.ingest.connector.notion.types.blocks.pdf": [], + "unstructured.ingest.connector.notion.types.blocks.quote": [], + "unstructured.ingest.connector.notion.types.blocks.synced_block": [], + "unstructured.ingest.connector.notion.types.blocks.table": [], + "unstructured.ingest.connector.notion.types.blocks.table_of_contents": [], + "unstructured.ingest.connector.notion.types.blocks.template": [], + "unstructured.ingest.connector.notion.types.blocks.todo": [], + "unstructured.ingest.connector.notion.types.blocks.toggle": [], + "unstructured.ingest.connector.notion.types.blocks.unsupported": [], + "unstructured.ingest.connector.notion.types.blocks.video": [], + "unstructured.ingest.connector.notion.types.database": [], + "unstructured.ingest.connector.notion.types.database_properties": [], + "unstructured.ingest.connector.notion.types.database_properties.checkbox": [], + "unstructured.ingest.connector.notion.types.database_properties.created_by": [], + "unstructured.ingest.connector.notion.types.database_properties.created_time": [], + "unstructured.ingest.connector.notion.types.database_properties.date": [], + "unstructured.ingest.connector.notion.types.database_properties.email": [], + "unstructured.ingest.connector.notion.types.database_properties.files": [], + "unstructured.ingest.connector.notion.types.database_properties.formula": [], + "unstructured.ingest.connector.notion.types.database_properties.last_edited_by": [], + "unstructured.ingest.connector.notion.types.database_properties.last_edited_time": [], + "unstructured.ingest.connector.notion.types.database_properties.multiselect": [], + "unstructured.ingest.connector.notion.types.database_properties.number": [], + "unstructured.ingest.connector.notion.types.database_properties.people": [], + "unstructured.ingest.connector.notion.types.database_properties.phone_number": [], + "unstructured.ingest.connector.notion.types.database_properties.relation": [], + "unstructured.ingest.connector.notion.types.database_properties.rich_text": [], + "unstructured.ingest.connector.notion.types.database_properties.rollup": [], + "unstructured.ingest.connector.notion.types.database_properties.select": [], + "unstructured.ingest.connector.notion.types.database_properties.status": [], + "unstructured.ingest.connector.notion.types.database_properties.title": [], + "unstructured.ingest.connector.notion.types.database_properties.unique_id": [], + "unstructured.ingest.connector.notion.types.database_properties.url": [], + "unstructured.ingest.connector.notion.types.database_properties.verification": [], + "unstructured.ingest.connector.notion.types.date": [], + "unstructured.ingest.connector.notion.types.file": [], + "unstructured.ingest.connector.notion.types.page": [], + "unstructured.ingest.connector.notion.types.parent": [], + "unstructured.ingest.connector.notion.types.rich_text": [], + "unstructured.ingest.connector.notion.types.user": [], + "unstructured.ingest.connector.onedrive": [], + "unstructured.ingest.connector.opensearch": [], + "unstructured.ingest.connector.outlook": [], + "unstructured.ingest.connector.pinecone": [], + "unstructured.ingest.connector.qdrant": [], + "unstructured.ingest.connector.reddit": [], + "unstructured.ingest.connector.registry": [], + "unstructured.ingest.connector.salesforce": [], + "unstructured.ingest.connector.sharepoint": [], + "unstructured.ingest.connector.slack": [], + "unstructured.ingest.connector.sql": [], + "unstructured.ingest.connector.vectara": [], + "unstructured.ingest.connector.weaviate": [], + "unstructured.ingest.connector.wikipedia": [], + "unstructured.ingest.enhanced_dataclass": [], + "unstructured.ingest.enhanced_dataclass.core": [], + "unstructured.ingest.enhanced_dataclass.dataclasses": [], + "unstructured.ingest.enhanced_dataclass.json_mixin": [], + "unstructured.ingest.error": [], + "unstructured.ingest.evaluate": [], + "unstructured.ingest.ingest_backoff": [], + "unstructured.ingest.ingest_backoff._common": [], + "unstructured.ingest.ingest_backoff._wrapper": [], + "unstructured.ingest.interfaces": [], + "unstructured.ingest.logger": [], + "unstructured.ingest.main": [], + "unstructured.ingest.pipeline": [], + "unstructured.ingest.pipeline.copy": [], + "unstructured.ingest.pipeline.doc_factory": [], + "unstructured.ingest.pipeline.interfaces": [], + "unstructured.ingest.pipeline.partition": [], + "unstructured.ingest.pipeline.permissions": [], + "unstructured.ingest.pipeline.pipeline": [], + "unstructured.ingest.pipeline.reformat": [], + "unstructured.ingest.pipeline.reformat.chunking": [], + "unstructured.ingest.pipeline.reformat.embedding": [], + "unstructured.ingest.pipeline.source": [], + "unstructured.ingest.pipeline.utils": [], + "unstructured.ingest.pipeline.write": [], + "unstructured.ingest.processor": [], + "unstructured.ingest.runner": [], + "unstructured.ingest.runner.airtable": [], + "unstructured.ingest.runner.base_runner": [], + "unstructured.ingest.runner.biomed": [], + "unstructured.ingest.runner.confluence": [], + "unstructured.ingest.runner.delta_table": [], + "unstructured.ingest.runner.discord": [], + "unstructured.ingest.runner.elasticsearch": [], + "unstructured.ingest.runner.fsspec": [], + "unstructured.ingest.runner.fsspec.azure": [], + "unstructured.ingest.runner.fsspec.box": [], + "unstructured.ingest.runner.fsspec.dropbox": [], + "unstructured.ingest.runner.fsspec.fsspec": [], + "unstructured.ingest.runner.fsspec.gcs": [], + "unstructured.ingest.runner.fsspec.s3": [], + "unstructured.ingest.runner.fsspec.sftp": [], + "unstructured.ingest.runner.github": [], + "unstructured.ingest.runner.gitlab": [], + "unstructured.ingest.runner.google_drive": [], + "unstructured.ingest.runner.hubspot": [], + "unstructured.ingest.runner.jira": [], + "unstructured.ingest.runner.kafka": [], + "unstructured.ingest.runner.local": [], + "unstructured.ingest.runner.mongodb": [], + "unstructured.ingest.runner.notion": [], + "unstructured.ingest.runner.onedrive": [], + "unstructured.ingest.runner.opensearch": [], + "unstructured.ingest.runner.outlook": [], + "unstructured.ingest.runner.reddit": [], + "unstructured.ingest.runner.salesforce": [], + "unstructured.ingest.runner.sharepoint": [], + "unstructured.ingest.runner.slack": [], + "unstructured.ingest.runner.utils": [], + "unstructured.ingest.runner.wikipedia": [], + "unstructured.ingest.runner.writers": [], + "unstructured.ingest.runner.writers.astra": [], + "unstructured.ingest.runner.writers.azure_cognitive_search": [], + "unstructured.ingest.runner.writers.base_writer": [], + "unstructured.ingest.runner.writers.chroma": [], + "unstructured.ingest.runner.writers.clarifai": [], + "unstructured.ingest.runner.writers.databricks_volumes": [], + "unstructured.ingest.runner.writers.delta_table": [], + "unstructured.ingest.runner.writers.elasticsearch": [], + "unstructured.ingest.runner.writers.fsspec": [], + "unstructured.ingest.runner.writers.fsspec.azure": [], + "unstructured.ingest.runner.writers.fsspec.box": [], + "unstructured.ingest.runner.writers.fsspec.dropbox": [], + "unstructured.ingest.runner.writers.fsspec.gcs": [], + "unstructured.ingest.runner.writers.fsspec.s3": [], + "unstructured.ingest.runner.writers.kafka": [], + "unstructured.ingest.runner.writers.mongodb": [], + "unstructured.ingest.runner.writers.opensearch": [], + "unstructured.ingest.runner.writers.pinecone": [], + "unstructured.ingest.runner.writers.qdrant": [], + "unstructured.ingest.runner.writers.sql": [], + "unstructured.ingest.runner.writers.vectara": [], + "unstructured.ingest.runner.writers.weaviate": [], + "unstructured.ingest.utils": [], + "unstructured.ingest.utils.compression": [], + "unstructured.ingest.utils.data_prep": [], + "unstructured.ingest.utils.string_and_date_utils": [], + "unstructured.ingest.utils.table": [], + "unstructured.ingest.v2": [], + "unstructured.ingest.v2.cli": [], + "unstructured.ingest.v2.cli.base": [], + "unstructured.ingest.v2.cli.base.cmd": [], + "unstructured.ingest.v2.cli.base.dest": [], + "unstructured.ingest.v2.cli.base.src": [], + "unstructured.ingest.v2.cli.cli": [], + "unstructured.ingest.v2.cli.cmds": [], + "unstructured.ingest.v2.cli.cmds.chroma": [], + "unstructured.ingest.v2.cli.cmds.elasticsearch": [], + "unstructured.ingest.v2.cli.cmds.fsspec": [], + "unstructured.ingest.v2.cli.cmds.fsspec.azure": [], + "unstructured.ingest.v2.cli.cmds.fsspec.box": [], + "unstructured.ingest.v2.cli.cmds.fsspec.dropbox": [], + "unstructured.ingest.v2.cli.cmds.fsspec.fsspec": [], + "unstructured.ingest.v2.cli.cmds.fsspec.gcs": [], + "unstructured.ingest.v2.cli.cmds.fsspec.s3": [], + "unstructured.ingest.v2.cli.cmds.fsspec.sftp": [], + "unstructured.ingest.v2.cli.cmds.local": [], + "unstructured.ingest.v2.cli.cmds.weaviate": [], + "unstructured.ingest.v2.cli.configs": [], + "unstructured.ingest.v2.cli.configs.chunk": [], + "unstructured.ingest.v2.cli.configs.embed": [], + "unstructured.ingest.v2.cli.configs.partition": [], + "unstructured.ingest.v2.cli.configs.processor": [], + "unstructured.ingest.v2.cli.interfaces": [], + "unstructured.ingest.v2.cli.utils": [], + "unstructured.ingest.v2.example": [], + "unstructured.ingest.v2.interfaces": [], + "unstructured.ingest.v2.interfaces.connector": [], + "unstructured.ingest.v2.interfaces.downloader": [], + "unstructured.ingest.v2.interfaces.file_data": [], + "unstructured.ingest.v2.interfaces.indexer": [], + "unstructured.ingest.v2.interfaces.process": [], + "unstructured.ingest.v2.interfaces.processor": [], + "unstructured.ingest.v2.interfaces.upload_stager": [], + "unstructured.ingest.v2.interfaces.uploader": [], + "unstructured.ingest.v2.logger": [], + "unstructured.ingest.v2.main": [], + "unstructured.ingest.v2.pipeline": [], + "unstructured.ingest.v2.pipeline.interfaces": [], + "unstructured.ingest.v2.pipeline.pipeline": [], + "unstructured.ingest.v2.pipeline.steps": [], + "unstructured.ingest.v2.pipeline.steps.chunk": [], + "unstructured.ingest.v2.pipeline.steps.download": [], + "unstructured.ingest.v2.pipeline.steps.embed": [], + "unstructured.ingest.v2.pipeline.steps.index": [], + "unstructured.ingest.v2.pipeline.steps.partition": [], + "unstructured.ingest.v2.pipeline.steps.stage": [], + "unstructured.ingest.v2.pipeline.steps.uncompress": [], + "unstructured.ingest.v2.pipeline.steps.upload": [], + "unstructured.ingest.v2.pipeline.utils": [], + "unstructured.ingest.v2.processes": [], + "unstructured.ingest.v2.processes.chunker": [], + "unstructured.ingest.v2.processes.connector_registry": [], + "unstructured.ingest.v2.processes.connectors": [], + "unstructured.ingest.v2.processes.connectors.chroma": [], + "unstructured.ingest.v2.processes.connectors.elasticsearch": [], + "unstructured.ingest.v2.processes.connectors.fsspec": [], + "unstructured.ingest.v2.processes.connectors.fsspec.azure": [], + "unstructured.ingest.v2.processes.connectors.fsspec.box": [], + "unstructured.ingest.v2.processes.connectors.fsspec.dropbox": [], + "unstructured.ingest.v2.processes.connectors.fsspec.fsspec": [], + "unstructured.ingest.v2.processes.connectors.fsspec.gcs": [], + "unstructured.ingest.v2.processes.connectors.fsspec.s3": [], + "unstructured.ingest.v2.processes.connectors.fsspec.sftp": [], + "unstructured.ingest.v2.processes.connectors.fsspec.utils": [], + "unstructured.ingest.v2.processes.connectors.local": [], + "unstructured.ingest.v2.processes.connectors.weaviate": [], + "unstructured.ingest.v2.processes.embedder": [], + "unstructured.ingest.v2.processes.partitioner": [], + "unstructured.ingest.v2.processes.uncompress": [], + "unstructured.logger": [], + "unstructured.metrics": [], + "unstructured.metrics.element_type": [], + "unstructured.metrics.evaluate": [], + "unstructured.metrics.table": [], + "unstructured.metrics.table.table_alignment": [], + "unstructured.metrics.table.table_eval": [], + "unstructured.metrics.table.table_extraction": [], + "unstructured.metrics.table.table_formats": [], + "unstructured.metrics.table_structure": [], + "unstructured.metrics.text_extraction": [], + "unstructured.metrics.utils": [], + "unstructured.models": [], + "unstructured.nlp": [], + "unstructured.nlp.english_words": [], + "unstructured.nlp.partition": [], + "unstructured.nlp.patterns": [], + "unstructured.nlp.tokenize": [], + "unstructured.partition": [], + "unstructured.partition.api": [], + "unstructured.partition.auto": [], + "unstructured.partition.common": [], + "unstructured.partition.csv": [], + "unstructured.partition.doc": [], + "unstructured.partition.docx": [], + "unstructured.partition.email": [], + "unstructured.partition.epub": [], + "unstructured.partition.html": [], + "unstructured.partition.html.parser": [], + "unstructured.partition.html.partition": [], + "unstructured.partition.image": [], + "unstructured.partition.json": [], + "unstructured.partition.lang": [], + "unstructured.partition.md": [], + "unstructured.partition.model_init": [], + "unstructured.partition.msg": [], + "unstructured.partition.odt": [], + "unstructured.partition.org": [], + "unstructured.partition.pdf": [], + "unstructured.partition.pdf_image": [], + "unstructured.partition.pdf_image.form_extraction": [], + "unstructured.partition.pdf_image.inference_utils": [], + "unstructured.partition.pdf_image.ocr": [], + "unstructured.partition.pdf_image.pdf_image_utils": [], + "unstructured.partition.pdf_image.pdfminer_processing": [], + "unstructured.partition.pdf_image.pdfminer_utils": [], + "unstructured.partition.pdf_image.pypdf_utils": [], + "unstructured.partition.ppt": [], + "unstructured.partition.pptx": [], + "unstructured.partition.rst": [], + "unstructured.partition.rtf": [], + "unstructured.partition.strategies": [], + "unstructured.partition.text": [], + "unstructured.partition.text_type": [], + "unstructured.partition.tsv": [], + "unstructured.partition.utils": [], + "unstructured.partition.utils.config": [], + "unstructured.partition.utils.constants": [], + "unstructured.partition.utils.ocr_models": [], + "unstructured.partition.utils.ocr_models.google_vision_ocr": [], + "unstructured.partition.utils.ocr_models.ocr_interface": [], + "unstructured.partition.utils.ocr_models.paddle_ocr": [], + "unstructured.partition.utils.ocr_models.tesseract_ocr": [], + "unstructured.partition.utils.sorting": [], + "unstructured.partition.utils.xycut": [], + "unstructured.partition.xlsx": [], + "unstructured.partition.xml": [], + "unstructured.patches": [], + "unstructured.patches.pdfminer": [], + "unstructured.staging": [], + "unstructured.staging.argilla": [], + "unstructured.staging.base": [], + "unstructured.staging.baseplate": [], + "unstructured.staging.datasaur": [], + "unstructured.staging.huggingface": [], + "unstructured.staging.label_box": [], + "unstructured.staging.label_studio": [], + "unstructured.staging.prodigy": [], + "unstructured.staging.weaviate": [], + "unstructured.utils": [] + }, + "unstructured-client": { + "unstructured_client": [], + "unstructured_client._hooks": [], + "unstructured_client._hooks.custom": [], + "unstructured_client._hooks.custom.clean_server_url_hook": [], + "unstructured_client._hooks.custom.common": [], + "unstructured_client._hooks.custom.form_utils": [], + "unstructured_client._hooks.custom.logger_hook": [], + "unstructured_client._hooks.custom.pdf_utils": [], + "unstructured_client._hooks.custom.request_utils": [], + "unstructured_client._hooks.custom.split_pdf_hook": [], + "unstructured_client._hooks.custom.suggest_defining_url": [], + "unstructured_client._hooks.registration": [], + "unstructured_client._hooks.sdkhooks": [], + "unstructured_client._hooks.types": [], + "unstructured_client.general": [], + "unstructured_client.models": [], + "unstructured_client.models.errors": [], + "unstructured_client.models.errors.httpvalidationerror": [], + "unstructured_client.models.errors.sdkerror": [], + "unstructured_client.models.errors.servererror": [], + "unstructured_client.models.operations": [], + "unstructured_client.models.operations.partition": [], + "unstructured_client.models.shared": [], + "unstructured_client.models.shared.partition_parameters": [], + "unstructured_client.models.shared.security": [], + "unstructured_client.models.shared.validationerror": [], + "unstructured_client.sdk": [], + "unstructured_client.sdkconfiguration": [], + "unstructured_client.utils": [], + "unstructured_client.utils.enums": [], + "unstructured_client.utils.retries": [], + "unstructured_client.utils.utils": [] + }, "urllib3": { "urllib3": [] },