I have a Streamlit app running (code attached). It was initially working, but today it gave an error:
openai.AuthenticationError: Error code: 401 - {'statusCode': 401, 'message': 'Unauthorized. Access token is missing, invalid, audience is incorrect (https://cognitiveservices.azure.com), or have expired.'}
I regenerated the tokens and redeployed the models (gpt-35-turbo-16k and text-embedding-3-large), but that still didn't fix the problem. I clicked on the URI endpoints from the OpenAI Studio, and they seemed to return a 404 (resource not found). I'm unsure what to do to rectify the issue.
import os
from dotenv import load_dotenv
from llama_index.llms.azure_openai import AzureOpenAI
from llama_index.embeddings.azure_openai import AzureOpenAIEmbedding
import pickle
from llama_index.core import Settings
import streamlit as st
import time
# Load env variables
def load_env_vars():
    """Load the Azure OpenAI connection settings from the environment.

    A local ``.env`` file is read first (when one exists) so that values
    defined there become visible to ``os.getenv``. Variables that are
    already set in the process environment are not overridden.

    Returns:
        A ``(api_key, azure_endpoint, api_version)`` tuple read from
        ``OPENAI_API_KEY``, ``OPENAI_API_ENDPOINT`` and
        ``OPENAI_API_VERSION``. An entry is ``None`` when its variable is
        not set.
    """
    # Without this call os.getenv only sees the process environment and any
    # values kept in a .env file are silently ignored.
    load_dotenv()

    names = ("OPENAI_API_KEY", "OPENAI_API_ENDPOINT", "OPENAI_API_VERSION")
    api_key, azure_endpoint, api_version = (os.getenv(name) for name in names)

    # Only report success when every setting is actually present; a missing
    # or empty value is a common cause of authentication failures later on.
    missing = [name for name in names if not os.getenv(name)]
    if missing:
        print(f"Missing environment variables: {', '.join(missing)}")
    else:
        print("env variables successfully loaded")
    return api_key, azure_endpoint, api_version
# Read the Azure OpenAI settings once, when the script runs.
# NOTE(review): none of these three values is referenced again in the visible
# code (nothing passes them to AzureOpenAI, AzureOpenAIEmbedding or Settings).
# Confirm they actually reach the client; if they do not, changing the key in
# the environment may have no effect on the requests being sent.
api_key, azure_endpoint, api_version = load_env_vars()
# Load pickle file
def load_index():
    """Unpickle the saved index and return a query engine built from it.

    Reads ``./bystander_index.pkl`` relative to the current working
    directory, so the script must be started from the directory that
    contains that file.

    Returns:
        The object returned by the unpickled index's ``as_query_engine()``.

    NOTE(review): unpickling restores the object exactly as it was saved.
    If model or client configuration was stored inside the index, it comes
    back unchanged -- confirm it does not carry stale credentials.
    NOTE(review): only unpickle files from a trusted source; ``pickle`` can
    execute arbitrary code while loading.
    """
    with open("./bystander_index.pkl", "rb") as pickle_file:
        restored_index = pickle.load(pickle_file)
    print("Pickle successfully loaded")
    return restored_index.as_query_engine()
# Build the query engine from the pickled index.
query_engine = load_index()

st.header("Chat with the Bystander")

# Initialize the chat message history the first time a session runs.
if "messages" not in st.session_state:
    st.session_state.messages = [
        {"role": "assistant", "content": "Ask me a question about the Bystander!"}
    ]

# Prompt for user input and save it to the chat history.
if prompt := st.chat_input("Your question"):
    st.session_state.messages.append({"role": "user", "content": prompt})

# Display the prior chat messages.
for message in st.session_state.messages:
    with st.chat_message(message["role"]):
        st.write(message["content"])

# If the last message is not from the assistant, generate a new response.
if st.session_state.messages[-1]["role"] != "assistant":
    with st.chat_message("assistant"):
        with st.spinner("Thinking..."):
            t_0 = time.time()
            answer = query_engine.query(st.session_state.messages[-1]["content"])
            print(f'Time taken for that is {time.time() - t_0}')
            # Show the answer right away; the history loop above has already
            # run for this pass, so it would not appear until the next rerun.
            st.write(answer.response)
            message = {"role": "assistant", "content": answer.response}
            st.session_state.messages.append(message)  # Add response to message history