Unstructured-IO
diff --git a/‎CHANGELOG.md
+3-1 b/‎CHANGELOG.md
+3-1
diff --git a/‎test_unstructured_ingest/expected-structured-output/local-single-file-with-pdf-infer-table-structure/layout-parser-paper-with-table.json
-170 b/‎test_unstructured_ingest/expected-structured-output/local-single-file-with-pdf-infer-table-structure/layout-parser-paper-with-table.json
-170
@@ -9,11 +9,13 @@
 
 ### Fixes
 
+* **Turn off XML resolve entities** Sets `resolve_entities=False` for XML parsing with `lxml`
+  to avoid text being dynamically injected into the XML document.
 * **Add backward compatibility for the deprecated pdf_infer_table_structure parameter**.
 * **Add the missing `form_extraction_skip_tables` argument to the `partition_pdf_or_image` call**.
-* **Turn off XML resolve entities** Sets `resolve_entities=False` for XML parsing with `lxml`
   to avoid text being dynamically injected into the XML document.
 * **Chromadb change from Add to Upsert using element_id to make idempotent**
+* **Disable `table_as_cells` output by default** to reduce overhead in partition; now `table_as_cells` is only produced when the env `EXTACT_TABLE_AS_CELLS` is `true`
 * **Reduce excessive logging** Change per page ocr info level logging into detail level trace logging
 * **Replace try block in `document_to_element_list` for handling HTMLDocument** Use `getattr(element, "type", "")` to get the `type` attribute of an element when it exists. This is a more explicit way to handle the special case for HTML documents and prevents other types of attribute error from being silenced by the try block
 
 
@@ -49,176 +49,6 @@
     "text": "Dataset | Base Model\" Large Model | Notes PubLayNet [38] P/M M Layouts of modern scientific documents PRImA [3) M - Layouts of scanned modern magazines and scientific reports Newspaper [17] P - Layouts of scanned US newspapers from the 20th century \u2018TableBank (18) P P Table region on modern scientific and business document HJDataset (31) | F/M - Layouts of history Japanese documents",
     "metadata": {
       "text_as_html": "<table><thead><th>Dataset</th><th>| Base Model!|</th><th>Large Model</th><th>| Notes</th></thead><tr><td>PubLayNet [33]</td><td>P/M</td><td>M</td><td>Layouts of modern scientific documents</td></tr><tr><td>PRImA [3]</td><td>M</td><td></td><td>Layouts of scanned modern magazines and scientific reports</td></tr><tr><td>Newspaper [17]</td><td>P</td><td></td><td>Layouts of scanned US newspapers from the 20th century</td></tr><tr><td>TableBank [18]</td><td>P</td><td></td><td>Table region on modern scientific and business document</td></tr><tr><td>HIDataset [31]</td><td>P/M</td><td></td><td>Layouts of history Japanese documents</td></tr></table>",
-      "table_as_cells": [
-        {
-          "x": 0,
-          "y": 0,
-          "w": 1,
-          "h": 1,
-          "content": "Dataset"
-        },
-        {
-          "x": 0,
-          "y": 1,
-          "w": 1,
-          "h": 1,
-          "content": "PubLayNet [33]"
-        },
-        {
-          "x": 0,
-          "y": 2,
-          "w": 1,
-          "h": 1,
-          "content": "PRImA [3]"
-        },
-        {
-          "x": 0,
-          "y": 3,
-          "w": 1,
-          "h": 1,
-          "content": "Newspaper [17]"
-        },
-        {
-          "x": 0,
-          "y": 4,
-          "w": 1,
-          "h": 1,
-          "content": "TableBank [18]"
-        },
-        {
-          "x": 0,
-          "y": 5,
-          "w": 1,
-          "h": 1,
-          "content": "HIDataset [31]"
-        },
-        {
-          "x": 1,
-          "y": 0,
-          "w": 1,
-          "h": 1,
-          "content": "| Base Model!|"
-        },
-        {
-          "x": 1,
-          "y": 1,
-          "w": 1,
-          "h": 1,
-          "content": "P/M"
-        },
-        {
-          "x": 1,
-          "y": 2,
-          "w": 1,
-          "h": 1,
-          "content": "M"
-        },
-        {
-          "x": 1,
-          "y": 3,
-          "w": 1,
-          "h": 1,
-          "content": "P"
-        },
-        {
-          "x": 1,
-          "y": 4,
-          "w": 1,
-          "h": 1,
-          "content": "P"
-        },
-        {
-          "x": 1,
-          "y": 5,
-          "w": 1,
-          "h": 1,
-          "content": "P/M"
-        },
-        {
-          "x": 2,
-          "y": 0,
-          "w": 1,
-          "h": 1,
-          "content": "Large Model"
-        },
-        {
-          "x": 2,
-          "y": 1,
-          "w": 1,
-          "h": 1,
-          "content": "M"
-        },
-        {
-          "x": 2,
-          "y": 2,
-          "w": 1,
-          "h": 1,
-          "content": ""
-        },
-        {
-          "x": 2,
-          "y": 3,
-          "w": 1,
-          "h": 1,
-          "content": ""
-        },
-        {
-          "x": 2,
-          "y": 4,
-          "w": 1,
-          "h": 1,
-          "content": ""
-        },
-        {
-          "x": 2,
-          "y": 5,
-          "w": 1,
-          "h": 1,
-          "content": ""
-        },
-        {
-          "x": 3,
-          "y": 0,
-          "w": 1,
-          "h": 1,
-          "content": "| Notes"
-        },
-        {
-          "x": 3,
-          "y": 1,
-          "w": 1,
-          "h": 1,
-          "content": "Layouts of modern scientific documents"
-        },
-        {
-          "x": 3,
-          "y": 2,
-          "w": 1,
-          "h": 1,
-          "content": "Layouts of scanned modern magazines and scientific reports"
-        },
-        {
-          "x": 3,
-          "y": 3,
-          "w": 1,
-          "h": 1,
-          "content": "Layouts of scanned US newspapers from the 20th century"
-        },
-        {
-          "x": 3,
-          "y": 4,
-          "w": 1,
-          "h": 1,
-          "content": "Table region on modern scientific and business document"
-        },
-        {
-          "x": 3,
-          "y": 5,
-          "w": 1,
-          "h": 1,
-          "content": "Layouts of history Japanese documents"
-        }
-      ],
       "filetype": "image/jpeg",
       "languages": [
         "eng"