From 7799e392985f0bd9235465327a3876b300a903e9 Mon Sep 17 00:00:00 2001 From: liuyuanchuang Date: Mon, 9 Feb 2026 22:18:30 +0800 Subject: [PATCH] fix: image as element --- app/services/ocr_service.py | 9 ++-- create_table.py | 100 ++++++++++++++++++++++++++++++++++++ create_table_pandas.py | 91 ++++++++++++++++++++++++++++++++ csv_to_xlsx.py | 88 +++++++++++++++++++++++++++++++ 数据表.csv | 23 +++++++++ 5 files changed, 308 insertions(+), 3 deletions(-) create mode 100644 create_table.py create mode 100644 create_table_pandas.py create mode 100644 csv_to_xlsx.py create mode 100644 数据表.csv diff --git a/app/services/ocr_service.py b/app/services/ocr_service.py index 8b52015..f1eb126 100644 --- a/app/services/ocr_service.py +++ b/app/services/ocr_service.py @@ -143,7 +143,7 @@ def _clean_latex_syntax_spaces(expr: str) -> str: # Remove spaces everywhere else (e.g., x \in -> x\in is fine) # Strategy: remove spaces before \ and between non-command chars, # but preserve the space after \command when followed by a non-\ char - cleaned = re.sub(r"\s+(?=\\)", "", content) # remove space before \cmd + cleaned = re.sub(r"\s+(?=\\)", "", content) # remove space before \cmd cleaned = re.sub(r"(?