load_template.py 957 B

123456789101112131415161718192021222324252627
  1. from llama_index.readers.file import PandasExcelReader
  2. from llama_index.readers.docling import DoclingReader
  3. from llama_index.core.node_parser import MarkdownNodeParser
  4. from pathlib import Path
'''
Reference: https://docs.llamaindex.ai/en/stable/examples/data_connectors/DoclingReaderDemo/
Install dependencies: uv pip install llama-index-readers-docling llama-index-node-parser-docling llama-index-readers-file
'''
  9. def read_docling():
  10. reader = DoclingReader(export_type=DoclingReader.ExportType.MARKDOWN, )
  11. res = reader.load_data(Path(r"C:\Users\mg\Downloads\塑料园艺多肉三件套-文案制作模版.xlsx"))
  12. print(res[0].text)
  13. with open("docling.md", "w", encoding="utf-8") as f:
  14. f.write(res[0].text)
  15. def read_excel(file_path):
  16. reader = PandasExcelReader()
  17. res = reader.load_data(file=r"C:\Users\mg\Downloads\塑料园艺多肉三件套-文案制作模版.xlsx")
  18. print(res)
  19. def main():
  20. read_docling()
  21. if __name__ == "__main__":
  22. main()