File size: 668 Bytes
49cf970
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
from llama_index.readers.docling import DoclingReader
from llama_index.node_parser.docling import DoclingNodeParser
import os
from pathlib import Path

def inspect_nodes(pdf_path: str = "nvidia_q4_fy24.pdf") -> None:
    """Print the metadata of the first node parsed from a PDF.

    The PDF is loaded with ``DoclingReader`` configured for JSON export, the
    resulting documents are split into nodes by ``DoclingNodeParser``, and
    the metadata keys plus the full metadata mapping of node 0 are printed
    to stdout. When parsing yields no nodes, a short notice is printed
    instead.

    Args:
        pdf_path: Path of the PDF to inspect. Defaults to
            ``"nvidia_q4_fy24.pdf"`` (a relative path), which was the
            previously hard-coded value, so calling with no arguments
            behaves as before.
    """
    # NOTE(review): JSON export is presumably what DoclingNodeParser expects
    # as input -- confirm against the llama-index Docling integration docs.
    reader = DoclingReader(export_type=DoclingReader.ExportType.JSON)
    documents = reader.load_data(file_path=Path(pdf_path))

    nodes = DoclingNodeParser().get_nodes_from_documents(documents)

    # Guard clause: nothing to inspect if the parser produced no nodes.
    if not nodes:
        print("No nodes created.")
        return

    first_node = nodes[0]
    print(f"Node 0 Metadata: {first_node.metadata.keys()}")
    print(f"Node 0 Metadata Content: {first_node.metadata}")

# Run the inspection only when this file is executed as a script, so that
# importing the module does not trigger PDF loading and printing.
if __name__ == "__main__":
    inspect_nodes()