RAGStringQueryEngine
, you are just calling llm.complete
from llama_index.response.schema import StreamingResponse

response = llm.stream_complete(...)
# source nodes and metadata optional
response_obj = StreamingResponse(response, source_nodes=[], metadata={})
return response_obj
return self.response_synthesizer.synthesize(query_str, nodes)