Ritesh-hf's picture
remove print statement
eb2df2d
raw
history blame
4.83 kB
import eventlet
eventlet.monkey_patch()
from dotenv import load_dotenv
from flask import Flask, request, render_template
from flask_cors import CORS
from flask_socketio import SocketIO, emit
from langchain_core.output_parsers import StrOutputParser
from langchain_core.prompts import ChatPromptTemplate
from langchain_core.runnables import RunnablePassthrough
from langchain_huggingface.embeddings import HuggingFaceEmbeddings
from langchain.retrievers.document_compressors import EmbeddingsFilter
from langchain.retrievers import ContextualCompressionRetriever
from langchain.retrievers import EnsembleRetriever
from langchain_community.vectorstores import FAISS
from langchain_groq import ChatGroq
from langchain import hub
import pickle
import os
# Load environment variables
load_dotenv(".env")
USER_AGENT = os.getenv("USER_AGENT")
GROQ_API_KEY = os.getenv("GROQ_API_KEY")
SECRET_KEY = os.getenv("SECRET_KEY")
SESSION_ID_DEFAULT = "abc123"
# Set environment variables
os.environ['USER_AGENT'] = USER_AGENT
os.environ["GROQ_API_KEY"] = GROQ_API_KEY
os.environ["TOKENIZERS_PARALLELISM"] = 'true'
# Initialize Flask app and SocketIO with CORS
app = Flask(__name__)
CORS(app)
socketio = SocketIO(app, cors_allowed_origins="*")
app.config['SESSION_COOKIE_SECURE'] = True # Use HTTPS
app.config['SESSION_COOKIE_HTTPONLY'] = True
app.config['SECRET_KEY'] = SECRET_KEY
embed_model = HuggingFaceEmbeddings(model_name="Alibaba-NLP/gte-multilingual-base", model_kwargs={"trust_remote_code":True})
llm = ChatGroq(
model="llama-3.1-8b-instant",
temperature=0.0,
max_tokens=1024,
max_retries=2
)
excel_vectorstore = FAISS.load_local(folder_path="./faiss_excel_doc_index", embeddings=embed_model, allow_dangerous_deserialization=True)
word_vectorstore = FAISS.load_local(folder_path="./faiss_recursive_split_word_doc_index", embeddings=embed_model, allow_dangerous_deserialization=True)
excel_vectorstore.merge_from(word_vectorstore)
combined_vectorstore = excel_vectorstore
with open('combined_recursive_keyword_retriever.pkl', 'rb') as f:
combined_keyword_retriever = pickle.load(f)
combined_keyword_retriever.k = 1000
semantic_retriever = combined_vectorstore.as_retriever(search_type="mmr", search_kwargs={"k": 100})
# initialize the ensemble retriever
ensemble_retriever = EnsembleRetriever(
retrievers=[combined_keyword_retriever, semantic_retriever], weights=[0.5, 0.5]
)
embeddings_filter = EmbeddingsFilter(embeddings=embed_model, similarity_threshold=0.4)
compression_retriever = ContextualCompressionRetriever(
base_compressor=embeddings_filter, base_retriever=semantic_retriever
)
template = """
User Instructions:
You are an Arabic AI Assistant focused on providing clear, concise responses.
Always answer truthfully. If the user query is irrelevant to the provided CONTEXT, respond stating the reason.
Generate responses in Arabic. Format any English words and numbers appropriately for clarity.
Round off numbers with decimal integers to two decimal integers.
Use bullet points or numbered lists where applicable for better organization.
Provide detailed yet concise answers, covering all important aspects.
Remember, responding outside the CONTEXT may lead to the termination of the interaction.
CONTEXT: {context}
Query: {question}
After generating your response, ensure proper formatting and text direction of Arabic and English words/numbers. Return only the AI-generated answer.
"""
prompt = ChatPromptTemplate.from_template(template)
output_parser = StrOutputParser()
def format_docs(docs):
return "\n\n".join(doc.page_content for doc in docs)
rag_chain = (
{"context": compression_retriever.with_config(run_name="Docs") | format_docs, "question": RunnablePassthrough()}
| prompt
| llm
| output_parser
)
# Function to handle WebSocket connection
@socketio.on('connect')
def handle_connect():
emit('connection_response', {'message': 'Connected successfully.'}, room=request.sid)
@socketio.on('ping')
def handle_ping(data):
emit('ping_response', {'message': 'Healthy Connection.'}, room=request.sid)
# Function to handle WebSocket disconnection
@socketio.on('disconnect')
def handle_disconnect():
emit('connection_response', {'message': 'Disconnected successfully.'})
# Function to handle WebSocket messages
@socketio.on('message')
def handle_message(data):
question = data.get('question')
try:
for chunk in rag_chain.stream(question):
emit('response', chunk, room=request.sid)
except Exception as e:
emit('response', {"error": "An error occurred while processing your request."}, room=request.sid)
# Home route
@app.route("/")
def index_view():
return render_template('chat.html')
# Main function to run the app
if __name__ == '__main__':
socketio.run(app, debug=True)