# Source: OBP-Opey/app.py (main branch) from the OpenBankProject/OBP-Opey repository on GitHub
# Description: This file contains the main FastAPI application (with a mounted Socket.IO server) that serves as the backend for the chatbot.
import redis
import openai
import os
import logging
import json
import sys
import subprocess
import uvicorn
import socketio
import traceback
import requests


from utils import get_conversation, save_conversation, overwrite_conversation, verifyJWT, search_index, num_tokens_from_conversation, token_required
from dotenv import load_dotenv
from openai import AsyncAssistantEventHandler
from typing_extensions import override
from fastapi import FastAPI

# Load environment variables from a local .env file.
# A failure here is deliberately non-fatal: the required variables may already
# be present in the process environment, so we only warn and carry on.
# `except Exception` (rather than a bare `except`) lets SystemExit and
# KeyboardInterrupt propagate normally.
try:
    load_dotenv()
except Exception as e:
    print(f"warning, error loading .env: {e}")

# Init FastAPI app
app = FastAPI()

# Create the Socket.IO server (sio) in ASGI mode.
# NOTE(review): cors_allowed_origins='*' allows any origin - confirm this is intended outside development.
sio=socketio.AsyncServer(cors_allowed_origins='*',async_mode='asgi')

# Wrap the Socket.IO server in an ASGI application and mount it on the FastAPI app at "/"
socket_app = socketio.ASGIApp(sio)
app.mount("/", socket_app)

# configure logging
logging.basicConfig(level=logging.INFO)

# Configure Redis: host and port are read from the environment, defaulting to localhost:6379
redis_host = os.getenv('REDIS_HOST', 'localhost')
redis_port = os.getenv('REDIS_PORT', 6379)
logging.info(f"Connecting to Redis at {redis_host}:{redis_port}")
# REDIS_PORT is a string when it comes from the environment, hence the int() conversion
redis_client = redis.StrictRedis(host=redis_host, port=int(redis_port), db=0)

# Test if Redis is connected; exit the process with status 1 when the ping raises a connection error
try:
    redis_client.ping()
except redis.exceptions.ConnectionError as e:
    logging.error(f"Error connecting to Redis: {e}")
    logging.info("Are you sure that you have correctly set the 'REDIS_HOST' and 'REDIS_PORT' environment variables?")
    sys.exit(1)

# Set your OpenAI API key, create OpenAI client
openai.api_key = os.getenv("OPENAI_API_KEY")
openai_client = openai.AsyncOpenAI()

# Locations of the metadata files and vector databases used for context search.
endpoint_metadata_path = os.getenv("ENDPOINT_METADATA_PATH")
# This variable was historically read under the misspelled name
# "GLOSSAY_METADATA_PATH". Prefer the correct spelling, but keep accepting the
# old one so that existing .env files continue to work.
glossary_metadata_path = os.getenv("GLOSSARY_METADATA_PATH") or os.getenv("GLOSSAY_METADATA_PATH")

endpoint_vector_database_path = os.getenv("ENDPOINT_VECTOR_DATABASE_PATH")
glossary_vector_database_path = os.getenv("GLOSSARY_VECTOR_DATABASE_PATH")

# Fail fast at import time when any of the required paths is not configured.
if not endpoint_metadata_path:
    raise FileNotFoundError("Could not find endpoint_metadata.json make sure it is set in the .env")
if not endpoint_vector_database_path:
    raise FileNotFoundError("Could not find endpoint vector database make sure it is set in the .env")
if not glossary_metadata_path:
    raise FileNotFoundError("Could not find glossary_metadata.json make sure it is set in the .env")
# Check the glossary *vector database* path here; the metadata path was
# previously checked twice, so a missing database path went unnoticed.
if not glossary_vector_database_path:
    raise FileNotFoundError("Could not find glossary vector database make sure it is set in the .env")


class OpeyEventHandler(AsyncAssistantEventHandler):
    """Relay OpenAI assistant stream events to a single Socket.IO client.

    Every event emitted by this handler is addressed to ``user_sid`` only.

    Parameters:
    user_sid: The Socket.IO session id of the client that receives the events.
    *args, **kwargs: Forwarded unchanged to ``AsyncAssistantEventHandler``.
    """

    def __init__(self, user_sid, *args, **kwargs):
        self.user_sid = user_sid
        super().__init__(*args, **kwargs)

    @override
    async def on_text_delta(self, delta, snapshot):
        """Forward one chunk of streamed assistant text to the client."""
        await sio.emit('response stream delta', {'assistant': f"{delta.value}"}, to=self.user_sid)

    @override
    async def on_message_created(self, message):
        """Tell the client that a new assistant message has started streaming."""
        await sio.emit('response stream start', to=self.user_sid)

    @override
    async def on_event(self, event) -> None:
        """Log stream events and report failed runs to the client."""
        # Delta events arrive once per text chunk; logging them would flood the log.
        if event.event != "thread.message.delta":
            logging.info(f"Event: {event.event}")

        if event.event == "thread.run.failed":
            last_error = event.data.last_error
            logging.error(f"Thread run failed: {last_error}")
            # last_error may be absent, so read its code defensively.
            if getattr(last_error, "code", None) == "rate_limit_exceeded":
                await sio.emit('error', {'error': 'Rate limit exceeded'}, to=self.user_sid)
            else:
                await sio.emit('error', {'error': 'Thread run failed'}, to=self.user_sid)

        # The base implementation is a coroutine function: it must be awaited,
        # otherwise an un-awaited coroutine object is created and discarded.
        await super().on_event(event)

    @override
    async def on_message_done(self, message):
        """Tell the client that the current assistant message is complete."""
        await sio.emit('response stream end', to=self.user_sid)

class Conversation():
    """Glue between Socket.IO clients and the Opey OpenAI assistant.

    A single instance serves every connected client, so per-client state (the
    OpenAI thread) is stored in a mapping keyed by Socket.IO session id rather
    than in one shared attribute.
    """

    def __init__(self, assistant_id: str, context_classifier_assistant_id: str = "asst_dtGSW0NS1HbxdpjQAbqXXf9F"):
        """
        Initializes a new instance of the Conversation class.

        Parameters:
        assistant_id (str): The ID of the openai assistant used for Opey.
        context_classifier_assistant_id (str): The ID of the openai assistant that decides
            whether a user message needs additional context from the vector databases.

        Returns:
        None
        """
        self.assistant_id = assistant_id
        self.context_classifier_assistant_id = context_classifier_assistant_id
        self.conversation = []
        # Socket.IO session id -> OpenAI thread for that client.
        self.threads = {}
        # Populated on the first successful connect.
        self.opey_assistant = None
        # Most recently created thread; kept only for backward compatibility
        # with code that reads `conversation.thread`.
        self.thread = None

    async def handle_connect(self, user_sid, auth):
        """
        Authenticates a newly connected client and opens an assistant thread for it.

        Args:
            user_sid: Socket.IO session id of the connecting client.
            auth: The auth payload sent by the client; expected to be a dict with a "token" entry.

        Returns:
            None. On failure an 'error' event is emitted to the client and no thread is
            registered, so later 'chat' events from that client are refused.
        """
        # The payload is client-controlled: it may be missing or lack a token.
        token = auth.get("token") if isinstance(auth, dict) else None
        if not token:
            logging.error("Invalid JWT: no token supplied")
            await sio.emit('error', {'error': 'Invalid JWT'}, to=user_sid)
            return

        response, jwt_valid = verifyJWT(token)
        if not jwt_valid:
            logging.error(f"Invalid JWT: {response}")
            # Address the event to this client only; without `to=` it is broadcast.
            # NOTE(review): returning False from the connect handler would refuse the
            # connection outright; the error-event protocol is kept here for existing clients.
            await sio.emit('error', {'error': 'Invalid JWT'}, to=user_sid)
            return

        logging.info(f"WebSocket opened with: {response}")
        logging.info("Connecting to assistant")
        self.opey_assistant = await openai_client.beta.assistants.retrieve(self.assistant_id)
        logging.info("Creating new assistant thread")
        thread = await openai_client.beta.threads.create()
        self.threads[user_sid] = thread
        self.thread = thread
        await sio.emit('message', {'data': 'Chatting with Opey'}, to=user_sid)
        return

    def handle_disconnect(self, user_sid):
        """Forget the assistant thread of a client that has disconnected."""
        self.threads.pop(user_sid, None)

    @staticmethod
    def _format_endpoint_context(endpoint_matches):
        """Render endpoint search matches as prompt text for the assistant."""
        if not endpoint_matches:
            return "No relevant endpoints were found for the users query when searching a vector database of the OpenBankProject's API documentation."

        formatted_matches = ', '.join(f"{m['path']} ({m['summary']})\n" for m in endpoint_matches)
        logging.info(f"Matches for query: \n{formatted_matches}\n")

        parts = ["Here are endpoints (in order of similarity) that matched the users query in a vector database search of the OpenBankProject's API documentation:\n"]
        for match in endpoint_matches:
            parts.append(f"\nEndpoint: {match['method'].upper()} {match['path']}\n")
            parts.append(f"Description: {match['description']}\n")
            if match['parameters'] != {}:
                try:
                    parts.append(f"Parameters: {', '.join(match['parameters']['properties'])}\n")
                except Exception as e:
                    # Best effort: a malformed parameter schema only costs this one line.
                    logging.info(f"Error obtaining context for {match}: \n{e}")
            else:
                # Trailing newline added so the following "Responses" line does not run on.
                parts.append("Parameters: This endpoint does not require any parameters\n")
            formatted_responses = ', '.join(f"{r['code']} {r['body']}" for r in match['responses'])
            parts.append(f"Responses: \n{formatted_responses}\n")
        return ''.join(parts)

    @staticmethod
    def _format_glossary_context(glossary_matches):
        """Render glossary search matches as prompt text for the assistant."""
        if not glossary_matches:
            return "No relevant glossary items were found for the users query when searching a vector database of the OpenBankProject's API documentation."

        parts = ["Here are some glossary entries (in order of similarity) that matched the users query in a vector database search of the OpenBankProject's API documentation:\n"]
        for match in glossary_matches:
            parts.append(f"\nTitle: {match['title']}\n")
            parts.append(f"Description: {match['description']}\n")
        return ''.join(parts)

    async def handle_chat(self, user_sid, data):
        """
        Chat function that handles the conversation between the user and the assistant.

        Args:
            user_sid: Socket.IO session id of the client that sent the message.
            data (dict): Payload of the 'chat' event. Reads 'session_id' and 'message'
                (both required) and 'obp_api_host'.

        Returns:
            None. The assistant's reply is streamed to the client as Socket.IO events
            by OpeyEventHandler; failures are reported through an 'error' event.
        """
        # The payload is client-controlled, so do not assume it is a dict.
        payload = data if isinstance(data, dict) else {}
        session_id = payload.get('session_id')
        user_message = payload.get('message')
        obp_api_host = payload.get('obp_api_host')

        # Validate session_id and user_message
        if not session_id or not user_message:
            await sio.emit('error', {'error': 'session_id and message are required'}, to=user_sid)
            return

        # Only clients that passed handle_connect own a thread.
        thread = self.threads.get(user_sid)
        if thread is None or self.opey_assistant is None:
            logging.error(f"Chat received from {user_sid} without an assistant thread")
            await sio.emit('error', {'error': 'No active assistant session, please reconnect'}, to=user_sid)
            return

        # Add message to assistant thread
        await openai_client.beta.threads.messages.create(thread.id, role="user", content=user_message)

        # Get conversation history from redis
        # Should implement a fallback mechanism in case redis does not work
        try:
            history = [json.loads(entry) for entry in await get_conversation(session_id, redis_client, app)]
        except Exception as e:
            logging.error(f"error occurred: {str(e)}")
            logging.error(traceback.format_exc())
            await sio.emit('error', {'error': f"could not load conversation"}, to=user_sid)
            return

        # Append user message to conversation
        # NOTE(review): the history is not consumed further in this method; confirm whether it is still needed.
        history.append({"role": "user", "content": user_message})

        # We query an assistant here to check if additional context is needed to answer the prompt
        context_classifier_assistant = await openai_client.beta.assistants.retrieve(self.context_classifier_assistant_id)

        context_run = await openai_client.beta.threads.runs.create_and_poll(
            thread_id=thread.id,
            assistant_id=context_classifier_assistant.id,
        )

        # If the classifier gives no usable answer, fall back to searching for
        # context rather than failing the whole request.
        context_required = True
        if context_run.status == "completed":
            messages = await openai_client.beta.threads.messages.list(thread_id=thread.id)
            context_messages = [msg async for msg in messages if msg.assistant_id == context_classifier_assistant.id]
            try:
                result = json.loads(context_messages[0].content[0].text.value)
                logging.info(f"Context requirements: {result['context_required']}")
                # Accept both the string 'true' and a JSON boolean true.
                context_required = str(result['context_required']).lower() == 'true'
            except Exception as e:
                logging.info(f"Could not get context requirements from assistant: {e}")
        else:
            logging.info(f"Context classifier run did not complete (status: {context_run.status})")

        if context_required:
            # Search for matches in the vector databases
            try:
                endpoint_matches = await search_index(user_message, endpoint_vector_database_path, endpoint_metadata_path, openai_client)
            except Exception as e:
                logging.info(f"Error searching for endpoint matches: {e}")
                await sio.emit('error', {'error': 'Internal Server Error'}, to=user_sid)
                return

            try:
                glossary_matches = await search_index(user_message, glossary_vector_database_path, glossary_metadata_path, openai_client)
            except Exception as e:
                logging.info(f"Error searching for glossary matches: {e}")
                await sio.emit('error', {'error': 'Internal Server Error'}, to=user_sid)
                # Stop here: continuing would use glossary_matches before assignment.
                return

            endpoint_context = self._format_endpoint_context(endpoint_matches)
            glossary_context = self._format_glossary_context(glossary_matches)
        else:
            endpoint_context = "The user message did not require additional endpoint context to answer the prompt."
            glossary_context = "The user message did not require additional glossary context to answer the prompt."

        # Create a run with the user message
        async with openai_client.beta.threads.runs.stream(
            thread_id=thread.id,
            assistant_id=self.opey_assistant.id,
            additional_instructions=f"""When giving examples of endpoints, always use the current OBP API host URL: {obp_api_host}
                Here is the some helpful information that could assist an answer to the current question: {endpoint_context} \n {glossary_context}""",
            event_handler=OpeyEventHandler(user_sid=user_sid),
            tool_choice="none", # This is to prevent context being added from the file_search tool as well as the vector searching we are doing in house, which causes the rate limit to be reached frequently
        ) as stream:
            await stream.until_done()

conversation = Conversation("asst_vbwdYbWsTisP7YmwQhykiEwp")

# Socket.IO calls the connect handler with (sid, environ, auth).
@sio.on('connect')
async def connect(sid, environ, auth):
    await conversation.handle_connect(sid, auth)

@sio.on('chat')
async def chat(sid, data):
    await conversation.handle_chat(sid, data)

# Depending on the python-socketio version, a disconnect reason may be passed as well.
@sio.on('disconnect')
async def disconnect(sid, *_args):
    conversation.handle_disconnect(sid)

"""
@app.post('/feedback')
async def feedback():
    data = request.json

@app.post('/create-consent')
async def create_consent(request: requests.Request):
    data = await request.json()
"""

# Script entry point: serve the app with uvicorn on all interfaces, port 5000,
# with auto-reload enabled. The log level comes from LOG_LEVEL (default INFO).
if __name__ == '__main__':
    uvicorn.run(
        "app:app",
        host="0.0.0.0",
        port=5000,
        lifespan="on",
        reload=True,
        log_level=os.getenv('LOG_LEVEL', 'INFO').lower(),
    )