@@ -19,7 +19,7 @@
Callable,
)


+from llama_index.core.async_utils import asyncio_run
import llama_index.core.instrumentation as instrument
from llama_index.core.base.llms.generic_utils import (
chat_to_completion_decorator,
@@ -309,7 +309,7 @@ def _chat(self, messages: Sequence[ChatMessage], **kwargs: Any):
**kwargs.pop("generation_config", {}),
}
params = {**kwargs, "generation_config": generation_config}
-next_msg, chat_kwargs = asyncio.run(
+next_msg, chat_kwargs = asyncio_run(
Collaborator:
I'm not actually sure if this will solve the issue or not.

Ideally, I think we'd remove the need for asyncio.run from the sync code path entirely.

Author:

Here is a detailed account of how we encountered this issue:

Steps to reproduce:

  • Call GoogleGenAI.structured_predict from an asynchronous method (a minimal standalone reproduction is sketched below).

There are two possible solutions:

  1. Completely unwrap asyncio.run and write synchronous alternatives for everything inside it.
  2. Remove the separate synchronous implementations and define each synchronous method as asyncio_run(asynchronous method).
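For reference, a minimal standalone sketch of the failure mode (the names _prepare, sync_helper, and caller are made up for illustration and are not llama_index code): a synchronous method that wraps its async implementation with asyncio.run breaks as soon as it is invoked from code already running inside an event loop.

```python
import asyncio


async def _prepare() -> str:
    # Stand-in for the async work (e.g. preparing chat params).
    return "prepared"


def sync_helper() -> str:
    # Synchronous wrapper that calls asyncio.run internally, like the old code path.
    return asyncio.run(_prepare())


async def caller() -> None:
    # Calling the sync wrapper from async code raises:
    #   RuntimeError: asyncio.run() cannot be called from a running event loop
    print(sync_helper())


asyncio.run(caller())
```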

Collaborator:

I think we should duplicate each method into a sync and an async version, and avoid any calls to asyncio.run or asyncio_run entirely (a rough sketch of this split follows).
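To make the suggestion concrete, here is a rough sketch of that split under assumed names (prepare_payload, aprepare_payload, and ChatClient are hypothetical stand-ins, not the actual llama_index helpers): the sync path calls a purely synchronous helper, the async path awaits an async helper, and neither needs asyncio.run or asyncio_run.

```python
import asyncio
from typing import Any, Dict, Sequence


def prepare_payload(messages: Sequence[str], **params: Any) -> Dict[str, Any]:
    # Synchronous variant: only blocking / in-memory work, no event loop involved.
    return {"history": list(messages[:-1]), "next_msg": messages[-1], **params}


async def aprepare_payload(messages: Sequence[str], **params: Any) -> Dict[str, Any]:
    # Asynchronous variant: free to await file uploads or other I/O here.
    return {"history": list(messages[:-1]), "next_msg": messages[-1], **params}


class ChatClient:
    def chat(self, messages: Sequence[str]) -> Dict[str, Any]:
        # Sync code path -> sync helper; safe to call with or without a running loop.
        return prepare_payload(messages)

    async def achat(self, messages: Sequence[str]) -> Dict[str, Any]:
        # Async code path -> async helper; no nested asyncio.run anywhere.
        return await aprepare_payload(messages)


print(ChatClient().chat(["hi", "there"]))
print(asyncio.run(ChatClient().achat(["hi", "there"])))
```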

prepare_chat_params(
self.model, messages, self.use_file_api, self._client, **params
)
@@ -320,7 +320,7 @@ def _chat(self, messages: Sequence[ChatMessage], **kwargs: Any):
)

if self.use_file_api:
-asyncio.run(
+asyncio_run(
delete_uploaded_files([*chat_kwargs["history"], next_msg], self._client)
)

@@ -366,7 +366,7 @@ def _stream_chat(
**kwargs.pop("generation_config", {}),
}
params = {**kwargs, "generation_config": generation_config}
-next_msg, chat_kwargs = asyncio.run(
+next_msg, chat_kwargs = asyncio_run(
prepare_chat_params(
self.model, messages, self.use_file_api, self._client, **params
)
@@ -405,7 +405,7 @@ def gen() -> ChatResponseGen:
yield llama_resp

if self.use_file_api:
-asyncio.run(
+asyncio_run(
delete_uploaded_files(
[*chat_kwargs["history"], next_msg], self._client
)
@@ -594,7 +594,7 @@ def structured_predict_without_function_calling(

messages = prompt.format_messages(**prompt_args)
contents = [
-asyncio.run(
+asyncio_run(
chat_message_to_gemini(message, self.use_file_api, self._client)
)
for message in messages
@@ -614,7 +614,7 @@
)

if self.use_file_api:
-asyncio.run(delete_uploaded_files(contents, self._client))
+asyncio_run(delete_uploaded_files(contents, self._client))

if isinstance(response.parsed, BaseModel):
return response.parsed
@@ -644,7 +644,7 @@ def structured_predict(

messages = prompt.format_messages(**prompt_args)
contents = [
-asyncio.run(
+asyncio_run(
chat_message_to_gemini(message, self.use_file_api, self._client)
)
for message in messages
@@ -656,7 +656,7 @@
)

if self.use_file_api:
-asyncio.run(delete_uploaded_files(contents, self._client))
+asyncio_run(delete_uploaded_files(contents, self._client))

if isinstance(response.parsed, BaseModel):
return response.parsed
@@ -738,7 +738,7 @@ def stream_structured_predict(

messages = prompt.format_messages(**prompt_args)
contents = [
-asyncio.run(
+asyncio_run(
chat_message_to_gemini(message, self.use_file_api, self._client)
)
for message in messages
@@ -767,7 +767,7 @@ def gen() -> Generator[Union[Model, FlexibleModel], None, None]:
yield streaming_model

if self.use_file_api:
-asyncio.run(delete_uploaded_files(contents, self._client))
+asyncio_run(delete_uploaded_files(contents, self._client))

return gen()
else: