diff --git a/unstructured/partition/pptx.py b/unstructured/partition/pptx.py index 0fc46c773e..7c55bcdefd 100644 --- a/unstructured/partition/pptx.py +++ b/unstructured/partition/pptx.py @@ -252,7 +252,7 @@ def _iter_table_element(self, graphfrm: GraphicFrame) -> Iterator[Table]: return html_text = htmlify_matrix_of_cell_texts( - [[cell.text for cell in row.cells] for row in rows] + [[cell.text.replace("\n", " ") for cell in row.cells] for row in rows] ) html_table = HtmlTable.from_html_text(html_text)