# Build the multi-modal LLM client used for the image query below.
# NOTE(review): `output_cls` is forwarded to the constructor as-is; confirm
# that the installed OpenAIMultiModal version actually recognises it.
image_llm = OpenAIMultiModal(
    model='gpt-4o',
    output_cls=output_class,
    api_key=api_key,
    max_new_tokens=1000,
    temperature=0.0,
)

# Wrap the single image URL in a list, as load_image_urls is called with a
# list of URLs here.
image_doc = load_image_urls(
    [image_url],
)

# Send the prompt together with the loaded image document(s) and keep the
# completion result for later use.
response_vision = image_llm.complete(
    prompt=prompt,
    image_documents=image_doc,
)