# Build a single Document by hand from an in-memory text string.
from llama_index import Document

# The text is passed as the first positional argument; `doc_id` and
# `extra_info` are passed by keyword.
# NOTE(review): the placeholder values suggest both keywords are optional --
# confirm against the installed llama_index version.
document = Document(
    "my pdf text string",
    doc_id="optional doc id",
    extra_info={"optional": "info dict"},
)