# Files
# hospital_performance/check_extracted.py
# 2026-02-28 15:16:15 +08:00
#
# 32 lines
# 1.1 KiB
# Python

import json
import sys
# Location of the JSON file holding the previously extracted content.
EXTRACTED_CONTENT_PATH = r"D:\医院绩效系统\extracted_content.json"

# Appendix labels to look for inside the extracted file names.
KEY_PATTERNS = ['附表一', '附表二', '附表三', '附表四', '附表五', '附表六', '附表七', '附表八', '附表九', '附表十', '附表十一', '附表十二', '附表十三']

# A label immediately followed by one of these characters is a different,
# longer label (e.g. '附表十' followed by '一' is '附表十一').
NUMERAL_CHARS = "一二三四五六七八九十"


def matches_appendix(filename, pattern):
    """Return True if *filename* contains *pattern* as a complete appendix label.

    A plain substring test would also report '附表十一...' under '附表十'.
    An occurrence only counts when the character right after it is not
    another Chinese numeral (or when it ends the file name).
    """
    start = filename.find(pattern)
    while start != -1:
        end = start + len(pattern)
        if end == len(filename) or filename[end] not in NUMERAL_CHARS:
            return True
        # This occurrence is the prefix of a longer label; keep searching.
        start = filename.find(pattern, start + 1)
    return False


def find_matching_files(data, pattern):
    """Return the keys of *data* carrying the label *pattern*, in mapping order."""
    return [name for name in data if matches_appendix(name, pattern)]


def print_content_summary(content):
    """Print a short summary of one extracted entry.

    Non-empty content that does not start with "Error" gets its length and
    a preview of the first 1000 characters; anything else is printed as-is
    (first 200 characters), or as 'Empty' when there is no content.
    Assumes *content* is a string or a falsy value -- TODO confirm against
    whatever produces the JSON file.
    """
    if content and not content.startswith("Error"):
        print(f" Content length: {len(content)} chars")
        # Print first 1000 chars
        print(f" Preview: {content[:1000]}...")
    else:
        print(f" Content: {content[:200] if content else 'Empty'}")


def main(path=EXTRACTED_CONTENT_PATH):
    """Load the extracted-content JSON at *path* and print an overview.

    Prints the number of entries, every file name in sorted order, and then,
    for each label in KEY_PATTERNS that has matching files, the matching file
    names with a summary of their content.

    Raises:
        OSError: if *path* cannot be opened.
        json.JSONDecodeError: if the file is not valid JSON.
    """
    # Switch stdout to UTF-8, presumably so the Chinese file names print on
    # consoles with a different default encoding. Skipped when stdout has
    # been replaced by an object without reconfigure().
    reconfigure = getattr(sys.stdout, "reconfigure", None)
    if reconfigure is not None:
        reconfigure(encoding='utf-8')

    # Read existing extracted content
    with open(path, 'r', encoding='utf-8') as f:
        data = json.load(f)

    print(f"Total files extracted: {len(data)}")
    print("\nAll file names:")
    for filename in sorted(data):
        print(f" {filename}")

    # Find key appendix files
    print("\n\n=== KEY APPENDIX FILES ===\n")
    for pattern in KEY_PATTERNS:
        found = find_matching_files(data, pattern)
        if not found:
            continue
        print(f"\n{pattern}:")
        for name in found:
            print(f" - {name}")
            print_content_summary(data[name])


if __name__ == "__main__":
    main()