HuggingFaceLLMPredictor
LangchainEmbedding
ServiceContext
llm_predictor.model.to('cpu')
del llm_predictor
torch.cuda.empty_cache()
embed_model
embed_model._langchain_embedding.client