Spaces:

Rajeev-Isaac
/

NyaaySahaayak

Sleeping

App Files Files Community

Rajeev-Isaac committed on Mar 28, 2024

Commit

2be028b

verified ·

1 Parent(s): ae56acc

Upload 8 files

Browse files

Files changed (8) hide show

Indianconstitution.csv +0 -0
classify.py +29 -0
format.py +13 -0
ingest.py +18 -0
langchain_helper.py +50 -0
main.py +26 -0
requirements.txt +12 -0
translate.py +21 -0

Indianconstitution.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

classify.py ADDED Viewed

	@@ -0,0 +1,29 @@

+from dotenv import load_dotenv
+import os
+import google.generativeai as genai
+# Load settings from a local .env file (if present) into the process environment
+# before GOOGLE_API_KEY is read below.
+load_dotenv()
+# Configure the Gemini client. os.environ[...] raises KeyError at import time
+# when GOOGLE_API_KEY is not set.
+genai.configure(api_key=os.environ["GOOGLE_API_KEY"])
+# Module-level model handle used by classify_query().
+model = genai.GenerativeModel('gemini-pro')
+def classify_query(query):
+    classifier_prompt = (
+        "## Query Classification\n"
+        "Please classify the following query as 'Indian Legal' or 'Non-Indian Legal':\n"
+        "Query: '{}'\n"
+        "Classification:"
+    )
+    # Compose prompt with the given query
+    prompt = classifier_prompt.format(query)
+    # Use Google Gen AI to generate a response based on the prompt
+    response = model.generate_content(prompt)
+    # Extract the generated classification from the response
+    classification = response.text.strip()
+    return classification

format.py ADDED Viewed

	@@ -0,0 +1,13 @@

+import re
+def format_paragraph(text):
+    text = text.replace("**", "</b>").replace("**", "<b>")
+    pattern = re.compile(r'</b>')
+    text = re.sub(pattern, lambda m: "<b>" if pattern.subn('', text[:m.start()])[1] % 2 == 0 else m.group(0), text)
+    text = text.replace('\n','<br>')
+    text = text.replace('*','&#8226')
+    return text

ingest.py ADDED Viewed

	@@ -0,0 +1,18 @@

+from langchain.embeddings import HuggingFaceInstructEmbeddings
+from langchain.vectorstores import FAISS
+from langchain.document_loaders.csv_loader import CSVLoader
+# Folder the FAISS index is saved to by save_local() below.
+vectordb_file_path = "faiss_index"
+# Embedding model used to vectorise the loaded documents.
+instructor_embeddings = HuggingFaceInstructEmbeddings(model_name="hkunlp/instructor-large")
+# 'utf-8-sig' decoding drops a leading byte-order mark if the CSV has one.
+loader = CSVLoader(file_path='Indianconstitution.csv',encoding='utf-8-sig')
+data = loader.load()
+# Embed the loaded documents and build the FAISS index from them ...
+vectordb = FAISS.from_documents(documents=data,
+                                    embedding=instructor_embeddings)
+# ... then persist the index to vectordb_file_path.
+vectordb.save_local(vectordb_file_path)

langchain_helper.py ADDED Viewed

	@@ -0,0 +1,50 @@

+from langchain.vectorstores import FAISS
+from langchain.llms import GooglePalm
+from langchain.document_loaders.csv_loader import CSVLoader
+from langchain.embeddings import HuggingFaceInstructEmbeddings
+from langchain.prompts import PromptTemplate
+from langchain.chains import RetrievalQA
+import os
+from dotenv import load_dotenv
+# Load settings from a local .env file (if present) into the process environment
+# before GOOGLE_API_KEY is read below.
+load_dotenv()
+# LLM handle used by get_qa_chain(); os.environ[...] raises KeyError at import
+# time when GOOGLE_API_KEY is not set.
+llm = GooglePalm(google_api_key=os.environ["GOOGLE_API_KEY"], temperature=0.1)
+# Embedding model passed to FAISS.load_local() in get_qa_chain().
+# NOTE(review): presumably this has to be the same model that built the saved
+# index - confirm against the ingestion script.
+instructor_embeddings = HuggingFaceInstructEmbeddings(model_name="hkunlp/instructor-large")
+# Folder the saved FAISS index is loaded from.
+vectordb_file_path = "faiss_index"
+def get_qa_chain():
+    vectordb = FAISS.load_local(vectordb_file_path, instructor_embeddings)
+    retriever = vectordb.as_retriever(score_threshold=0.7)
+    prompt_template = """You are a legal assistant chatbot, your name is "Nyaay Sahaayak", your main aim is to answer the queries related to the Indian laws and legal system,
+    if the question is not related to Indian laws and legal system kindly say dont know about the given question
+    Given the following context and a question, generate an answer based on the context or related to the Indian laws and legal system. The context given may not be always right
+    for the given question, hence cross verify yourself inorder to give an accurate answer that is only related to Indian laws and legal system.
+    Add some creativity to make the answer look readable and easily understandable. If the answer is not found in the context, kindly state "I don't know." Don't try to make up an answer,
+    if the question is out of the Indian laws and legal system, strictly deny them that you are not trained for it and only here for Indian law and legal system.
+    CONTEXT: {context}
+    QUESTION: {question}
+    """
+    PROMPT = PromptTemplate(
+        template=prompt_template, input_variables=["context", "question"]
+    )
+    chain = RetrievalQA.from_chain_type(llm=llm,
+                                        chain_type="stuff",
+                                        retriever=retriever,
+                                        input_key="query",
+                                        return_source_documents=True,
+                                        chain_type_kwargs={"prompt": PROMPT})
+    return chain
+if __name__ == "__main__":
+    # Running the module directly only builds the chain (which loads the saved
+    # index); nothing is queried. Presumably kept as a manual load check.
+    chain = get_qa_chain()

main.py ADDED Viewed

	@@ -0,0 +1,26 @@

+from flask import Flask, render_template, request
+from translate import translate
+from classify import classify_query
+# Flask application object. Static assets are read from web/static and, because
+# static_url_path is '', are served from the URL root rather than under /static.
+app = Flask(__name__,static_url_path='', static_folder='web/static')
+@app.route('/')
+def index():
+    """Render the index.html template for the site root."""
+    return render_template('index.html')
+@app.route('/NyaaySahaayak')
+def NyaaySahaayak():
+    """Render the NyaaySahaayak.html template."""
+    return render_template('NyaaySahaayak.html')
+@app.route('/chat', methods=['POST'])
+def chat():
+    user_message = request.form['user_message']
+    classification = classify_query(user_message)
+    if classification == 'Non-Indian Legal':
+        response = "Apologies, but I'm here to assist with questions related to Indian laws and legal matters only. If you have any queries within this domain, feel free to ask. Otherwise, I may not have the information you're looking for. Thank you for understanding."
+    else:
+        response = translate(user_message)
+    return {'bot_response': response}
+if __name__ == '__main__':
+    # When run as a script, listen on all network interfaces on port 8000.
+    app.run(host='0.0.0.0', port=8000)

requirements.txt ADDED Viewed

	@@ -0,0 +1,12 @@

+langchain==0.0.284
+python-dotenv==1.0.0
+streamlit==1.22.0
+tiktoken==0.4.0
+faiss-cpu==1.7.4
+protobuf~=3.19.0
+google-generativeai
+sentence-transformers==2.2.2
+InstructorEmbedding==1.0.0
+googletrans==4.0.0rc1
+flask
+# `re` is part of the Python standard library, not an installable distribution,
+# so it must not be listed here: pip cannot resolve it and the install fails.

translate.py ADDED Viewed

	@@ -0,0 +1,21 @@

+from langchain_helper import get_qa_chain
+from googletrans import Translator
+from format import format_paragraph
+# googletrans client shared by every translate() call.
+translator = Translator()
+# The QA chain is built once at import time; translate() reuses it per message.
+chain = get_qa_chain()
+def translate(user_message):
+    query = user_message
+    result = translator.detect(query)
+    lang = result.lang
+    if(lang != 'en'):
+        translatedlang = translator.translate(query)
+        user_message = translatedlang.text
+    bot_response = chain(user_message)
+    response = bot_response['result']
+    response = format_paragraph(response)
+    if(lang != 'en'):
+        translation = translator.translate(response, dest=result.lang)
+        response = translation.text
+    return response