azure_open_ai
vhr1007 committed · Commit b9ffe6a · Parent(s): 88bbe7d

Files changed:
- config.py (+2 -1)
- services/openai_service.py (+21 -4)
config.py
CHANGED

@@ -5,4 +5,5 @@ QDRANT_URL = os.getenv('QDRANT_URL')
 QDRANT_ACCESS_TOKEN = os.getenv('QDRANT_ACCESS_TOKEN')
 OPENAI_API_KEY = os.getenv('OPENAI_API_KEY')
 JWKS_URL = os.getenv('JWKS_URL')
-X_API_KEY = os.getenv('X_API_KEY')
+X_API_KEY = os.getenv('X_API_KEY')
+AZURE_OPENAI_KEY = os.getenv('AZURE_OPENAI_KEY')
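The commit adds a single new setting, AZURE_OPENAI_KEY, alongside the existing keys. For reference, here is a minimal sketch (not part of the commit) of how the new variables could be checked before the Space starts; the require_env helper is hypothetical, and the endpoint variable is only read later in services/openai_service.py.

import os

def require_env(name: str) -> str:
    # Hypothetical helper: fail fast when a required variable is unset
    value = os.getenv(name)
    if not value:
        raise RuntimeError(f"Missing required environment variable: {name}")
    return value

# Mirrors the settings this commit relies on
AZURE_OPENAI_KEY = require_env('AZURE_OPENAI_KEY')
AZURE_OPENAI_ENDPOINT = require_env('AZURE_OPENAI_ENDPOINT')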
services/openai_service.py
CHANGED

@@ -1,13 +1,24 @@
+
 import logging
 import os
 from openai import OpenAI
+from openai import AzureOpenAI
 from openai import OpenAIError, RateLimitError
-from config import OPENAI_API_KEY
+from config import OPENAI_API_KEY, AZURE_OPENAI_KEY
 
 # Initialize the OpenAI client with the API key from the environment variable
 #api_key = os.getenv('OPENAI_API_KEY')
+# client = OpenAI(api_key=OPENAI_API_KEY)
+
+AZURE_OPENAI_ENDPOINT = os.getenv('AZURE_OPENAI_ENDPOINT')
+AZURE_API_VERSION = "2024-02-15-preview"  # API version for Azure OpenAI
 
-client = OpenAI(api_key=OPENAI_API_KEY)
+# Initialize the Azure OpenAI client with the endpoint and API key
+client = AzureOpenAI(
+    azure_endpoint=AZURE_OPENAI_ENDPOINT,
+    api_key=AZURE_OPENAI_KEY,
+    api_version=AZURE_API_VERSION
+)
 
 def generate_rag_response(json_output, user_query):
     logging.info("Generating RAG response")
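This hunk brings in AzureOpenAI and the Azure key, and switches the module-level client from OpenAI to AzureOpenAI. As a reference, a minimal standalone sketch of the same initialization with an explicit guard for the endpoint variable; the guard and the example endpoint format are illustrative assumptions, not part of the commit.

import os
from openai import AzureOpenAI

# The endpoint typically looks like https://<resource-name>.openai.azure.com/
endpoint = os.getenv('AZURE_OPENAI_ENDPOINT')
if not endpoint:
    raise RuntimeError("AZURE_OPENAI_ENDPOINT is not set")

client = AzureOpenAI(
    azure_endpoint=endpoint,
    api_key=os.getenv('AZURE_OPENAI_KEY'),
    api_version="2024-02-15-preview",
)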
@@ -28,8 +39,9 @@ def generate_rag_response(json_output, user_query):
         # Create a chat completion request
         chat_completion = client.chat.completions.create(
             messages=main_prompt,
-            model="gpt-
-
+            model="gpt-35-turbo",  # Use the gpt-4o-mini model
+            max_tokens=486,  # Limit the maximum number of tokens in the response
+            temperature=1
         )
 
         # Log the response from the model
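One detail worth noting about the new completion call: with the AzureOpenAI client, the model argument names a deployment in the Azure OpenAI resource, so "gpt-35-turbo" here must match a deployment created on the Azure side. Below is a small sketch of the call shape with placeholder messages; the prompt content is illustrative only, since the real main_prompt is built from json_output and user_query elsewhere in the function.

main_prompt = [
    {"role": "system", "content": "Answer using the retrieved context."},
    {"role": "user", "content": "What does this service do?"},
]

chat_completion = client.chat.completions.create(
    messages=main_prompt,
    model="gpt-35-turbo",   # Azure deployment name
    max_tokens=486,         # cap on response length
    temperature=1,
)
print(chat_completion.choices[0].message.content)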
@@ -46,3 +58,8 @@ def generate_rag_response(json_output, user_query):
     except Exception as e:
         logging.error(f"Unexpected error: {e}")
         return None, str(e)
+
+
+
+
+
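For completeness, a hedged sketch of how the updated service might be exercised once AZURE_OPENAI_KEY and AZURE_OPENAI_ENDPOINT are set. The retrieval payload is a made-up placeholder, and the (result, error) return shape is inferred from the except branch visible in the diff.

from services.openai_service import generate_rag_response

# Placeholder retrieval output; in the Space the real json_output comes from the Qdrant search step
json_output = [{"text": "Example passage retrieved from Qdrant."}]

response, error = generate_rag_response(json_output, "Summarize the retrieved passage.")
if error:
    print(f"Generation failed: {error}")
else:
    print(response)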