LICENSE.md
MANIFEST.in
README.md
pyproject.toml
setup.cfg
setup.py
requirements/base.in
requirements/huggingface.in
test_unstructured/__init__.py
test_unstructured/test_utils.py
test_unstructured/unit_utils.py
test_unstructured/nlp/__init__.py
test_unstructured/nlp/mock_nltk.py
test_unstructured/nlp/test_partition.py
test_unstructured/nlp/test_tokenize.py
test_unstructured/partition/__init__.py
test_unstructured/partition/test_api.py
test_unstructured/partition/test_auto.py
test_unstructured/partition/test_common.py
test_unstructured/partition/test_constants.py
test_unstructured/partition/test_email.py
test_unstructured/partition/test_html_partition.py
test_unstructured/partition/test_json.py
test_unstructured/partition/test_lang.py
test_unstructured/partition/test_strategies.py
test_unstructured/partition/test_text.py
test_unstructured/partition/test_text_type.py
test_unstructured/partition/test_xml_partition.py
test_unstructured/partition/csv/__init__.py
test_unstructured/partition/csv/test_csv.py
test_unstructured/partition/csv/test_tsv.py
test_unstructured/partition/docx/__init__.py
test_unstructured/partition/docx/test_doc.py
test_unstructured/partition/docx/test_docx.py
test_unstructured/partition/epub/__init__.py
test_unstructured/partition/epub/test_epub.py
test_unstructured/partition/markdown/__init__.py
test_unstructured/partition/markdown/test_md.py
test_unstructured/partition/msg/__init__.py
test_unstructured/partition/msg/test_msg.py
test_unstructured/partition/odt/__init__.py
test_unstructured/partition/odt/test_odt.py
test_unstructured/partition/pdf_image/__init__.py
test_unstructured/partition/pdf_image/test_chipper.py
test_unstructured/partition/pdf_image/test_image.py
test_unstructured/partition/pdf_image/test_ocr.py
test_unstructured/partition/pdf_image/test_pdf.py
test_unstructured/partition/pptx/__init__.py
test_unstructured/partition/pptx/test_ppt.py
test_unstructured/partition/pptx/test_pptx.py
test_unstructured/partition/pypandoc/__init__.py
test_unstructured/partition/pypandoc/test_org.py
test_unstructured/partition/pypandoc/test_rst.py
test_unstructured/partition/pypandoc/test_rtf.py
test_unstructured/partition/xlsx/__init__.py
test_unstructured/partition/xlsx/test_xlsx.py
unstructured/__init__.py
unstructured/__version__.py
unstructured/logger.py
unstructured/utils.py
unstructured.egg-info/PKG-INFO
unstructured.egg-info/SOURCES.txt
unstructured.egg-info/dependency_links.txt
unstructured.egg-info/entry_points.txt
unstructured.egg-info/requires.txt
unstructured.egg-info/top_level.txt
unstructured/chunking/__init__.py
unstructured/chunking/title.py
unstructured/cleaners/__init__.py
unstructured/cleaners/core.py
unstructured/cleaners/extract.py
unstructured/cleaners/translate.py
unstructured/documents/__init__.py
unstructured/documents/base.py
unstructured/documents/coordinates.py
unstructured/documents/elements.py
unstructured/documents/email_elements.py
unstructured/documents/html.py
unstructured/documents/xml.py
unstructured/embed/__init__.py
unstructured/embed/bedrock.py
unstructured/embed/huggingface.py
unstructured/embed/interfaces.py
unstructured/embed/openai.py
unstructured/file_utils/__init__.py
unstructured/file_utils/encoding.py
unstructured/file_utils/exploration.py
unstructured/file_utils/file_conversion.py
unstructured/file_utils/filetype.py
unstructured/file_utils/google_filetype.py
unstructured/file_utils/metadata.py
unstructured/ingest/__init__.py
unstructured/ingest/error.py
unstructured/ingest/evaluate.py
unstructured/ingest/interfaces.py
unstructured/ingest/logger.py
unstructured/ingest/main.py
unstructured/ingest/processor.py
unstructured/ingest/cli/__init__.py
unstructured/ingest/cli/cli.py
unstructured/ingest/cli/cmd_factory.py
unstructured/ingest/cli/common.py
unstructured/ingest/cli/interfaces.py
unstructured/ingest/cli/utils.py
unstructured/ingest/cli/base/__init__.py
unstructured/ingest/cli/base/cmd.py
unstructured/ingest/cli/base/dest.py
unstructured/ingest/cli/base/src.py
unstructured/ingest/cli/cmds/__init__.py
unstructured/ingest/cli/cmds/airtable.py
unstructured/ingest/cli/cmds/azure.py
unstructured/ingest/cli/cmds/azure_cognitive_search.py
unstructured/ingest/cli/cmds/biomed.py
unstructured/ingest/cli/cmds/box.py
unstructured/ingest/cli/cmds/confluence.py
unstructured/ingest/cli/cmds/delta_table.py
unstructured/ingest/cli/cmds/discord.py
unstructured/ingest/cli/cmds/dropbox.py
unstructured/ingest/cli/cmds/elasticsearch.py
unstructured/ingest/cli/cmds/fsspec.py
unstructured/ingest/cli/cmds/gcs.py
unstructured/ingest/cli/cmds/github.py
unstructured/ingest/cli/cmds/gitlab.py
unstructured/ingest/cli/cmds/google_drive.py
unstructured/ingest/cli/cmds/hubspot.py
unstructured/ingest/cli/cmds/jira.py
unstructured/ingest/cli/cmds/local.py
unstructured/ingest/cli/cmds/mongodb.py
unstructured/ingest/cli/cmds/notion.py
unstructured/ingest/cli/cmds/onedrive.py
unstructured/ingest/cli/cmds/outlook.py
unstructured/ingest/cli/cmds/reddit.py
unstructured/ingest/cli/cmds/s3.py
unstructured/ingest/cli/cmds/salesforce.py
unstructured/ingest/cli/cmds/sharepoint.py
unstructured/ingest/cli/cmds/slack.py
unstructured/ingest/cli/cmds/wikipedia.py
unstructured/ingest/connector/__init__.py
unstructured/ingest/connector/airtable.py
unstructured/ingest/connector/azure.py
unstructured/ingest/connector/azure_cognitive_search.py
unstructured/ingest/connector/biomed.py
unstructured/ingest/connector/box.py
unstructured/ingest/connector/confluence.py
unstructured/ingest/connector/delta_table.py
unstructured/ingest/connector/discord.py
unstructured/ingest/connector/dropbox.py
unstructured/ingest/connector/elasticsearch.py
unstructured/ingest/connector/fsspec.py
unstructured/ingest/connector/gcs.py
unstructured/ingest/connector/git.py
unstructured/ingest/connector/github.py
unstructured/ingest/connector/gitlab.py
unstructured/ingest/connector/google_drive.py
unstructured/ingest/connector/hubspot.py
unstructured/ingest/connector/jira.py
unstructured/ingest/connector/local.py
unstructured/ingest/connector/mongodb.py
unstructured/ingest/connector/onedrive.py
unstructured/ingest/connector/outlook.py
unstructured/ingest/connector/reddit.py
unstructured/ingest/connector/registry.py
unstructured/ingest/connector/s3.py
unstructured/ingest/connector/salesforce.py
unstructured/ingest/connector/sharepoint.py
unstructured/ingest/connector/slack.py
unstructured/ingest/connector/wikipedia.py
unstructured/ingest/connector/notion/__init__.py
unstructured/ingest/connector/notion/client.py
unstructured/ingest/connector/notion/connector.py
unstructured/ingest/connector/notion/helpers.py
unstructured/ingest/connector/notion/interfaces.py
unstructured/ingest/connector/notion/types/__init__.py
unstructured/ingest/connector/notion/types/block.py
unstructured/ingest/connector/notion/types/database.py
unstructured/ingest/connector/notion/types/date.py
unstructured/ingest/connector/notion/types/file.py
unstructured/ingest/connector/notion/types/page.py
unstructured/ingest/connector/notion/types/parent.py
unstructured/ingest/connector/notion/types/rich_text.py
unstructured/ingest/connector/notion/types/user.py
unstructured/ingest/connector/notion/types/blocks/__init__.py
unstructured/ingest/connector/notion/types/blocks/bookmark.py
unstructured/ingest/connector/notion/types/blocks/breadcrumb.py
unstructured/ingest/connector/notion/types/blocks/bulleted_list_item.py
unstructured/ingest/connector/notion/types/blocks/callout.py
unstructured/ingest/connector/notion/types/blocks/child_database.py
unstructured/ingest/connector/notion/types/blocks/child_page.py
unstructured/ingest/connector/notion/types/blocks/code.py
unstructured/ingest/connector/notion/types/blocks/column_list.py
unstructured/ingest/connector/notion/types/blocks/divider.py
unstructured/ingest/connector/notion/types/blocks/embed.py
unstructured/ingest/connector/notion/types/blocks/equation.py
unstructured/ingest/connector/notion/types/blocks/file.py
unstructured/ingest/connector/notion/types/blocks/heading.py
unstructured/ingest/connector/notion/types/blocks/image.py
unstructured/ingest/connector/notion/types/blocks/link_preview.py
unstructured/ingest/connector/notion/types/blocks/link_to_page.py
unstructured/ingest/connector/notion/types/blocks/numbered_list.py
unstructured/ingest/connector/notion/types/blocks/paragraph.py
unstructured/ingest/connector/notion/types/blocks/pdf.py
unstructured/ingest/connector/notion/types/blocks/quote.py
unstructured/ingest/connector/notion/types/blocks/synced_block.py
unstructured/ingest/connector/notion/types/blocks/table.py
unstructured/ingest/connector/notion/types/blocks/table_of_contents.py
unstructured/ingest/connector/notion/types/blocks/template.py
unstructured/ingest/connector/notion/types/blocks/todo.py
unstructured/ingest/connector/notion/types/blocks/toggle.py
unstructured/ingest/connector/notion/types/blocks/unsupported.py
unstructured/ingest/connector/notion/types/blocks/video.py
unstructured/ingest/connector/notion/types/database_properties/__init__.py
unstructured/ingest/connector/notion/types/database_properties/checkbox.py
unstructured/ingest/connector/notion/types/database_properties/created_by.py
unstructured/ingest/connector/notion/types/database_properties/created_time.py
unstructured/ingest/connector/notion/types/database_properties/date.py
unstructured/ingest/connector/notion/types/database_properties/email.py
unstructured/ingest/connector/notion/types/database_properties/files.py
unstructured/ingest/connector/notion/types/database_properties/formula.py
unstructured/ingest/connector/notion/types/database_properties/last_edited_by.py
unstructured/ingest/connector/notion/types/database_properties/last_edited_time.py
unstructured/ingest/connector/notion/types/database_properties/multiselect.py
unstructured/ingest/connector/notion/types/database_properties/number.py
unstructured/ingest/connector/notion/types/database_properties/people.py
unstructured/ingest/connector/notion/types/database_properties/phone_number.py
unstructured/ingest/connector/notion/types/database_properties/relation.py
unstructured/ingest/connector/notion/types/database_properties/rich_text.py
unstructured/ingest/connector/notion/types/database_properties/rollup.py
unstructured/ingest/connector/notion/types/database_properties/select.py
unstructured/ingest/connector/notion/types/database_properties/status.py
unstructured/ingest/connector/notion/types/database_properties/title.py
unstructured/ingest/connector/notion/types/database_properties/unique_id.py
unstructured/ingest/connector/notion/types/database_properties/url.py
unstructured/ingest/connector/notion/types/database_properties/verification.py
unstructured/ingest/ingest_backoff/__init__.py
unstructured/ingest/ingest_backoff/_common.py
unstructured/ingest/ingest_backoff/_wrapper.py
unstructured/ingest/pipeline/__init__.py
unstructured/ingest/pipeline/copy.py
unstructured/ingest/pipeline/doc_factory.py
unstructured/ingest/pipeline/interfaces.py
unstructured/ingest/pipeline/partition.py
unstructured/ingest/pipeline/permissions.py
unstructured/ingest/pipeline/pipeline.py
unstructured/ingest/pipeline/source.py
unstructured/ingest/pipeline/utils.py
unstructured/ingest/pipeline/write.py
unstructured/ingest/pipeline/reformat/__init__.py
unstructured/ingest/pipeline/reformat/chunking.py
unstructured/ingest/pipeline/reformat/embedding.py
unstructured/ingest/runner/__init__.py
unstructured/ingest/runner/airtable.py
unstructured/ingest/runner/azure.py
unstructured/ingest/runner/base_runner.py
unstructured/ingest/runner/biomed.py
unstructured/ingest/runner/box.py
unstructured/ingest/runner/confluence.py
unstructured/ingest/runner/delta_table.py
unstructured/ingest/runner/discord.py
unstructured/ingest/runner/dropbox.py
unstructured/ingest/runner/elasticsearch.py
unstructured/ingest/runner/fsspec.py
unstructured/ingest/runner/gcs.py
unstructured/ingest/runner/github.py
unstructured/ingest/runner/gitlab.py
unstructured/ingest/runner/google_drive.py
unstructured/ingest/runner/hubspot.py
unstructured/ingest/runner/jira.py
unstructured/ingest/runner/local.py
unstructured/ingest/runner/notion.py
unstructured/ingest/runner/onedrive.py
unstructured/ingest/runner/outlook.py
unstructured/ingest/runner/reddit.py
unstructured/ingest/runner/s3.py
unstructured/ingest/runner/salesforce.py
unstructured/ingest/runner/sharepoint.py
unstructured/ingest/runner/slack.py
unstructured/ingest/runner/utils.py
unstructured/ingest/runner/wikipedia.py
unstructured/ingest/runner/writers/__init__.py
unstructured/ingest/runner/writers/azure.py
unstructured/ingest/runner/writers/azure_cognitive_search.py
unstructured/ingest/runner/writers/box.py
unstructured/ingest/runner/writers/delta_table.py
unstructured/ingest/runner/writers/dropbox.py
unstructured/ingest/runner/writers/gcs.py
unstructured/ingest/runner/writers/mongodb.py
unstructured/ingest/runner/writers/s3.py
unstructured/ingest/utils/__init__.py
unstructured/ingest/utils/compression.py
unstructured/ingest/utils/table.py
unstructured/metrics/__init__.py
unstructured/metrics/element_type.py
unstructured/metrics/evaluate.py
unstructured/metrics/table_structure.py
unstructured/metrics/text_extraction.py
unstructured/models/__init__.py
unstructured/nlp/__init__.py
unstructured/nlp/english-words.txt
unstructured/nlp/english_words.py
unstructured/nlp/partition.py
unstructured/nlp/patterns.py
unstructured/nlp/tokenize.py
unstructured/partition/__init__.py
unstructured/partition/api.py
unstructured/partition/auto.py
unstructured/partition/common.py
unstructured/partition/csv.py
unstructured/partition/doc.py
unstructured/partition/docx.py
unstructured/partition/email.py
unstructured/partition/epub.py
unstructured/partition/html.py
unstructured/partition/image.py
unstructured/partition/json.py
unstructured/partition/lang.py
unstructured/partition/md.py
unstructured/partition/model_init.py
unstructured/partition/msg.py
unstructured/partition/ocr.py
unstructured/partition/odt.py
unstructured/partition/org.py
unstructured/partition/pdf.py
unstructured/partition/ppt.py
unstructured/partition/pptx.py
unstructured/partition/rst.py
unstructured/partition/rtf.py
unstructured/partition/strategies.py
unstructured/partition/text.py
unstructured/partition/text_type.py
unstructured/partition/tsv.py
unstructured/partition/xlsx.py
unstructured/partition/xml.py
unstructured/partition/utils/__init__.py
unstructured/partition/utils/config.py
unstructured/partition/utils/constants.py
unstructured/partition/utils/processing_elements.py
unstructured/partition/utils/sorting.py
unstructured/partition/utils/xycut.py
unstructured/partition/utils/ocr_models/__init__.py
unstructured/partition/utils/ocr_models/paddle_ocr.py
unstructured/staging/__init__.py
unstructured/staging/argilla.py
unstructured/staging/base.py
unstructured/staging/baseplate.py
unstructured/staging/datasaur.py
unstructured/staging/huggingface.py
unstructured/staging/label_box.py
unstructured/staging/label_studio.py
unstructured/staging/prodigy.py
unstructured/staging/weaviate.py