Files
yiliao/backend/_check_report.py

24 lines
951 B
Python
Raw Normal View History

import sys

from docx import Document
# Diagnostic script: print every direct child element of the report body
# whose text contains one of the section keywords listed below.

# The report to inspect may be passed as the first command-line argument;
# when none is given, the originally hard-coded report is used.
report_path = (
    sys.argv[1]
    if len(sys.argv) > 1
    else r'C:\Users\UI\Desktop\医疗报告\backend\reports\filled_report_20260212_154247.docx'
)
doc = Document(report_path)
body = doc.element.body
# Snapshot of the body's direct children; the index printed below refers to
# a position in this list.
children = list(body)

# English keywords are lowercase because they are compared against the
# lowercased element text.
keywords = [
    'overall health', '整体健康', 'medical intervention', '医学干预',
    'functional medical health', '功能医学健康建议',
    'nutrition intervention', '营养干预', 'exercise intervention', '运动干预',
    'sleep', '睡眠', 'lifestyle', '生活方式', 'long-term', '长期随访',
    '功能医学检测档案', 'abnormal index', '异常指标',
]

print(f"文档总元素数: {len(children)}")
print("=" * 80)
for i, elem in enumerate(children):
    # Join every text node found under this element into one string.
    text = ''.join(elem.itertext()).strip()
    if not text:
        # Elements without any visible text cannot match a keyword.
        continue
    text_lower = text.lower()
    if any(kw in text_lower for kw in keywords):
        # Keep only the part of the tag after the last "}" (the local name
        # when the tag is written as "{namespace}name").
        tag = elem.tag.split("}")[-1]
        # Print at most the first 150 characters of the matching text.
        print(f'[{i}] {tag}: {text[:150]}')