移除了print特定列

This commit is contained in:
zstar 2025-06-09 19:06:09 +08:00 committed by GitHub
parent ab4d2da1cf
commit d5fbd8d620
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
1 changed file with 14 additions and 25 deletions

View File

@ -1,32 +1,21 @@
import pandas as pd


def parse_excel(file_path):
    """Convert every data row of every worksheet in an Excel file into a table block.

    Each row becomes its own two-row HTML table: the sheet's column headers
    on the first row and that row's values on the second.

    Args:
        file_path: Path (or any other input accepted by ``pandas.read_excel``)
            of the workbook to read.

    Returns:
        A list of dicts, one per data row, in sheet order then row order.
        Each dict has the keys ``type`` (always ``"table"``), ``img_path``
        (empty string), ``table_caption`` (``["Sheet: <sheet name>"]``),
        ``table_footnote`` (empty list), ``table_body`` (the HTML string)
        and ``page_idx`` (always ``0``).

    Raises:
        Whatever ``pandas.read_excel`` raises for a missing or unreadable
        file, or when no Excel engine is installed.
    """
    # sheet_name=None makes pandas return a mapping of sheet name -> DataFrame
    # covering every worksheet instead of only the first one.
    all_sheets = pd.read_excel(file_path, sheet_name=None)

    blocks = []
    for sheet_name, df in all_sheets.items():
        # Forward-fill empty cells so the blanks left behind by merged cells
        # inherit the value above them. DataFrame.ffill() is the supported
        # spelling; fillna(method="ffill") is deprecated since pandas 2.1.
        df = df.ffill()
        headers = df.columns.tolist()

        # The header row is identical for every row of the sheet: build it once.
        header_cells = "".join(f"<td>{col}</td>" for col in headers)

        for _, row in df.iterrows():
            # NOTE(review): cell values are interpolated without HTML escaping,
            # exactly as before; confirm downstream consumers tolerate raw
            # "<", ">" and "&" in cell text.
            value_cells = "".join(f"<td>{row[col]}</td>" for col in headers)
            html_table = (
                "<html><body><table>"
                f"<tr>{header_cells}</tr><tr>{value_cells}</tr>"
                "</table></body></html>"
            )
            blocks.append(
                {
                    "type": "table",
                    "img_path": "",
                    "table_caption": [f"Sheet: {sheet_name}"],
                    "table_footnote": [],
                    "table_body": html_table,
                    "page_idx": 0,
                }
            )
    return blocks