diff --git a/platform/supported-file-types.mdx b/platform/supported-file-types.mdx index 740aba45..c250657b 100644 --- a/platform/supported-file-types.mdx +++ b/platform/supported-file-types.mdx @@ -2,6 +2,6 @@ title: Supported file types --- -import SupportedFileTypes from '/snippets/general-shared-text/supported-file-types.mdx'; +import SupportedFileTypesPlatform from '/snippets/general-shared-text/supported-file-types-platform.mdx'; - \ No newline at end of file + \ No newline at end of file diff --git a/snippets/general-shared-text/supported-file-types-platform.mdx b/snippets/general-shared-text/supported-file-types-platform.mdx new file mode 100644 index 00000000..7f32dc99 --- /dev/null +++ b/snippets/general-shared-text/supported-file-types-platform.mdx @@ -0,0 +1,94 @@ +The Unstructured Platform supports processing of the following file types: + +By file extension: + +| File extension | +| --- | +| `.abw` | +| `.bmp` | +| `.csv` | +| `.cwk` | +| `.dbf` | +| `.dif` | +| `.doc` | +| `.docm` | +| `.docx` | +| `.dot` | +| `.dotm` | +| `.eml` | +| `.epub` | +| `.et` | +| `.eth` | +| `.fods` | +| `.gif` | +| `.heic` | +| `.htm` | +| `.html` | +| `.hwp` | +| `.jpeg` | +| `.jpg` | +| `.md` | +| `.mcw` | +| `.mw` | +| `.odt` | +| `.org` | +| `.p7s` | +| `.pages` | +| `.pbd` | +| `.pdf` | +| `.png` | +| `.pot` | +| `.potm` | +| `.ppt` | +| `.pptm` | +| `.pptx` | +| `.prn` | +| `.rst` | +| `.rtf` | +| `.sdp` | +| `.sgl` | +| `.svg` | +| `.sxg` | +| `.tiff` | +| `.txt` | +| `.tsv` | +| `.uof` | +| `.uos1` | +| `.uos2` | +| `.web` | +| `.webp` | +| `.wk2` | +| `.xls` | +| `.xlsb` | +| `.xlsm` | +| `.xlsx` | +| `.xlw` | +| `.xml` | +| `.zabw` | + +By file type: + +| Category | File types | +| --- | --- | +| Apple | `.cwk`, `.mcw`, `.pages` | +| CSV | `.csv` | +| Data interchange | `.dif` | +| dBase | `.dbf` | +| E-mail | `.eml`, `.p7s` | +| EPUB | `.epub` | +| HTML | `.htm`, `.html` | +| Image | `.bmp`, `.gif`, `.heic`, `.jpeg`, `.jpg`, `.png`, `.prn`, `.svg`, `.tiff`, `.webp` |
+| Markdown | `.md` | +| Org Mode | `.org` | +| Open Office | `.odt`, `.sgl` | +| Other | `.eth`, `.mw`, `.pbd`, `.sdp`, `.uof`, `.web` | +| PDF | `.pdf` | +| Plain text | `.txt` | +| PowerPoint | `.pot`, `.potm`, `.ppt`, `.pptm`, `.pptx` | +| reStructured Text | `.rst` | +| Rich Text | `.rtf` | +| Spreadsheet | `.et`, `.fods`, `.uos1`, `.uos2`, `.wk2`, `.xls`, `.xlsb`, `.xlsm`, `.xlsx`, `.xlw` | +| StarOffice | `.sxg` | +| TSV | `.tsv` | +| Word processing | `.abw`, `.doc`, `.docm`, `.docx`, `.dot`, `.dotm`, `.hwp`, `.zabw` | +| XML | `.xml` |