From fc24a0546790c178475faae1217477ba651576ec Mon Sep 17 00:00:00 2001 From: Logan Markewich Date: Tue, 12 Sep 2023 09:48:08 -0600 Subject: [PATCH 1/3] remove default api version --- llama_index/llms/azure_openai.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/llama_index/llms/azure_openai.py b/llama_index/llms/azure_openai.py index e85c82f806120..23bd7579112ce 100644 --- a/llama_index/llms/azure_openai.py +++ b/llama_index/llms/azure_openai.py @@ -6,7 +6,6 @@ from llama_index.llms.openai import OpenAI AZURE_OPENAI_API_TYPE = "azure" -AZURE_OPENAI_VERSION = "2023-08-01-preview" class AzureOpenAI(OpenAI): @@ -47,7 +46,7 @@ def __init__( api_key: Optional[str] = None, api_type: Optional[str] = AZURE_OPENAI_API_TYPE, api_base: Optional[str] = None, - api_version: Optional[str] = AZURE_OPENAI_VERSION, + api_version: Optional[str] = None, callback_manager: Optional[CallbackManager] = None, **kwargs: Any, ) -> None: From 22dcac14ce0e9ae90c405f3ace4acab3d150f966 Mon Sep 17 00:00:00 2001 From: Logan Markewich Date: Tue, 12 Sep 2023 09:48:26 -0600 Subject: [PATCH 2/3] Improve streaming support for azure --- llama_index/llms/openai.py | 20 ++++++++++++++++---- 1 file changed, 16 insertions(+), 4 deletions(-) diff --git a/llama_index/llms/openai.py b/llama_index/llms/openai.py index 2e71fcc43698f..3ba109b8f5b7d 100644 --- a/llama_index/llms/openai.py +++ b/llama_index/llms/openai.py @@ -226,7 +226,10 @@ def gen() -> ChatResponseGen: stream=True, **all_kwargs, ): - delta = response["choices"][0]["delta"] + if len(response["choices"]) > 0: + delta = response["choices"][0]["delta"] + else: + delta = "" role = delta.get("role", "assistant") content_delta = delta.get("content", "") or "" content += content_delta @@ -302,7 +305,10 @@ def gen() -> CompletionResponseGen: stream=True, **all_kwargs, ): - delta = response["choices"][0]["text"] + if len(response["choices"]) > 0: + delta = response["choices"][0]["text"] + else: + delta = "" text += delta yield 
CompletionResponse( delta=delta, @@ -439,7 +445,10 @@ async def gen() -> ChatResponseAsyncGen: stream=True, **all_kwargs, ): - delta = response["choices"][0]["delta"] + if len(response["choices"]) > 0: + delta = response["choices"][0]["delta"] + else: + delta = "" role = delta.get("role", "assistant") content_delta = delta.get("content", "") or "" content += content_delta @@ -517,7 +526,10 @@ async def gen() -> CompletionResponseAsyncGen: stream=True, **all_kwargs, ): - delta = response["choices"][0]["text"] + if len(response["choices"]) > 0: + delta = response["choices"][0]["text"] + else: + delta = "" text += delta yield CompletionResponse( delta=delta, From d10e47c0091cca22612c361548afd81028a6c0cc Mon Sep 17 00:00:00 2001 From: Logan Markewich Date: Tue, 12 Sep 2023 09:51:28 -0600 Subject: [PATCH 3/3] changelog --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 4b02d691cfdf9..e0fd4fa27561e 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -4,6 +4,7 @@ ### Bug Fixes / Nits - Allowed `simple` mode to work with `as_chat_engine()` (#7637) +- Fixed index error in azure streaming (#7646) ## [0.8.24] - 2023-09-11