移除了print特定列

2025-06-09 19:06:09 +08:00 · 2025-06-09 19:06:09 +08:00 · d5fbd8d620
parent ab4d2da1cf
commit d5fbd8d620
1 changed files with 14 additions and 25 deletions
--- a/management/server/services/knowledgebases/excel_parser.py
+++ b/management/server/services/knowledgebases/excel_parser.py
@@ -1,32 +1,21 @@
 import pandas as pd
def parse_excel(file_path):
    """Convert every row of every worksheet in an Excel file into a table block.

    Each data row becomes one block whose ``table_body`` is a two-row HTML
    table: the sheet's column headers followed by that row's values.

    Args:
        file_path: Workbook location, passed straight to ``pandas.read_excel``.

    Returns:
        A list of dicts, one per data row, ordered by sheet and then by row.
        Every dict carries the keys ``type``, ``img_path``, ``table_caption``,
        ``table_footnote``, ``table_body`` and ``page_idx``.
    """
    # sheet_name=None asks pandas for a {sheet name: DataFrame} mapping that
    # covers every worksheet instead of only the first one.
    all_sheets = pd.read_excel(file_path, sheet_name=None)

    blocks = []
    for sheet_name, df in all_sheets.items():
        # Forward-fill so cells left empty by merged ranges take the value
        # above them. DataFrame.ffill() replaces the deprecated
        # fillna(method="ffill") spelling.
        df = df.ffill()
        headers = df.columns.tolist()
        # The header row is identical for every data row of a sheet, so it is
        # rendered once per sheet rather than once per row.
        header_cells = "".join(f"<td>{col}</td>" for col in headers)
        # NOTE(review): header and cell text is inserted without HTML
        # escaping; confirm what downstream consumers expect before changing.
        for _, row in df.iterrows():
            value_cells = "".join(f"<td>{row[col]}</td>" for col in headers)
            html_table = (
                "<html><body><table>"
                f"<tr>{header_cells}</tr><tr>{value_cells}</tr>"
                "</table></body></html>"
            )
            blocks.append(
                {
                    "type": "table",
                    "img_path": "",
                    "table_caption": [f"Sheet: {sheet_name}"],
                    "table_footnote": [],
                    "table_body": html_table,
                    "page_idx": 0,
                }
            )
    return blocks