from quivr_core.parsers import SimpleParser

# Basic usage: build a parser with its default settings, parse one file,
# and print the page_content of every document the parser returns.
parser = SimpleParser()
documents = parser.parse("path/to/document.txt")
for doc in documents:
    print(f"Content: {doc.page_content}")
# Configure the parser explicitly instead of relying on its defaults.
# Each argument sits on its own line so that its trailing comment cannot
# swallow the arguments that follow it.
parser = SimpleParser(
    chunk_size=500,  # Number of characters per chunk
    chunk_overlap=50,  # Number of overlapping characters between chunks
    strip_whitespace=True,  # Remove excess whitespace
    lowercase=False,  # Convert text to lowercase
)
Was this page helpful?