24 lines
951 B
Python
24 lines
951 B
Python
|
|
from docx import Document
|
||
|
|
|
||
|
|
# Location of the generated report to inspect.
report_path = r'C:\Users\UI\Desktop\医疗报告\backend\reports\filled_report_20260212_154247.docx'

# Section-heading fragments (English and Chinese) to look for in the document.
keywords = ['overall health', '整体健康', 'medical intervention', '医学干预',
            'functional medical health', '功能医学健康建议',
            'nutrition intervention', '营养干预', 'exercise intervention', '运动干预',
            'sleep', '睡眠', 'lifestyle', '生活方式', 'long-term', '长期随访',
            '功能医学检测档案', 'abnormal index', '异常指标']


def find_keyword_matches(elements, needles):
    """Return the elements whose text contains any of *needles*.

    Args:
        elements: Iterable of XML elements exposing ``itertext()`` and a
            string ``tag`` (e.g. the children of a document body).
        needles: Iterable of substrings to search for. Matching is
            case-insensitive: both the needles and the element text are
            lowercased before comparison.

    Returns:
        A list of ``(index, tag, text)`` tuples, in input order, where
        ``index`` is the element's position in *elements*, ``tag`` is the
        element tag with any ``{namespace}`` prefix removed, and ``text`` is
        the element's concatenated, whitespace-stripped text.
    """
    # Lowercase the needles once so an upper-case keyword cannot silently
    # fail to match against the lowercased element text.
    lowered = [needle.lower() for needle in needles]

    matches = []
    for index, elem in enumerate(elements):
        text = ''.join(elem.itertext()).strip()
        if not text:
            continue
        haystack = text.lower()
        if any(needle in haystack for needle in lowered):
            # Keep only the local name: "{namespace}p" -> "p".
            tag = elem.tag.split("}")[-1]
            matches.append((index, tag, text))
    return matches


def main():
    """Open the report and print every body element that mentions a keyword."""
    # ``Document`` comes from the file's top-level ``from docx import Document``.
    doc = Document(report_path)
    children = list(doc.element.body)

    print(f"文档总元素数: {len(children)}")
    print("=" * 80)

    for index, tag, text in find_keyword_matches(children, keywords):
        # Truncate long paragraphs/tables so each hit stays on one line.
        print(f'[{index}] {tag}: {text[:150]}')


if __name__ == "__main__":
    main()
|