| 123456789101112131415161718192021222324252627 |
- from llama_index.readers.file import PandasExcelReader
- from llama_index.readers.docling import DoclingReader
- from llama_index.core.node_parser import MarkdownNodeParser
- from pathlib import Path
# Reference: https://docs.llamaindex.ai/en/stable/examples/data_connectors/DoclingReaderDemo/
# Install:   uv pip install llama-index-readers-docling llama-index-node-parser-docling llama-index-readers-file
def read_docling(
    file_path=r"C:\Users\mg\Downloads\塑料园艺多肉三件套-文案制作模版.xlsx",
    output_path="docling.md",
):
    """Convert a document to Markdown with Docling, print it, and save it.

    Args:
        file_path: Document to convert (str or path-like). Defaults to the
            sample workbook this script was originally written against, so
            calling ``read_docling()`` with no arguments behaves as before.
        output_path: File that receives the Markdown text, written as UTF-8.

    Raises:
        IndexError: If the reader returns no documents, since only the
            first document is used.
    """
    reader = DoclingReader(export_type=DoclingReader.ExportType.MARKDOWN)
    documents = reader.load_data(Path(file_path))

    # Only the first document is printed and saved.
    markdown = documents[0].text
    print(markdown)

    # Explicit UTF-8 so non-ASCII cell contents survive on platforms whose
    # default encoding is not UTF-8 (e.g. Windows).
    with open(output_path, "w", encoding="utf-8") as out:
        out.write(markdown)
def read_excel(file_path):
    """Load an Excel workbook with ``PandasExcelReader`` and print the result.

    Args:
        file_path: Path (str or path-like) of the workbook to load.
    """
    reader = PandasExcelReader()
    # Load the caller-supplied workbook. The argument used to be ignored in
    # favour of a hard-coded path, so every call read the same file.
    documents = reader.load_data(file=Path(file_path))
    print(documents)
def main():
    """Script entry point: run the Docling conversion demo."""
    read_docling()
# Run the demo only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
|