-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathlangchain_code.py
More file actions
61 lines (45 loc) · 2.39 KB
/
langchain_code.py
File metadata and controls
61 lines (45 loc) · 2.39 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
from langchain_community.vectorstores import FAISS
from langchain_google_genai import GoogleGenerativeAI
from langchain_community.document_loaders.csv_loader import CSVLoader
from langchain_huggingface.embeddings import HuggingFaceEmbeddings
from langchain.prompts import PromptTemplate
from langchain.chains import RetrievalQA
import os
from dotenv import load_dotenv
load_dotenv() # take environment variables from .env (especially openai api key)
# Create Google Palm LLM model
llm = GoogleGenerativeAI(google_api_key=os.environ["GOOGLE_API_KEY"], model="models/text-bison-001", temperature=0.1)
# # Initialize instructor embeddings using the Hugging Face model
embeddings = HuggingFaceEmbeddings(model_name="hkunlp/instructor-large")
vectordb_file_path = "faiss_index"
def create_vector_db():
# Load data from FAQ sheet
loader = CSVLoader(file_path='website_faqs.csv', source_column="prompt")
data = loader.load()
# Create a FAISS instance for vector database from 'data'
vectordb = FAISS.from_documents(documents=data, embedding=embeddings)
# Save vector database locally
vectordb.save_local(vectordb_file_path)
def get_qa_chain():
# Load the vector database from the local folder
vectordb = FAISS.load_local(vectordb_file_path, embeddings, allow_dangerous_deserialization=True)
# Create a retriever for querying the vector database
retriever = vectordb.as_retriever(score_threshold=0.7)
prompt_template = """Given the following context and a question, generate an answer based on this context only.
In the answer try to provide as much text as possible from "response" section in the source document context without making much changes.
If the answer is not found in the context, kindly state "I don't know." Don't try to make up an answer.
CONTEXT: {context}
QUESTION: {question}"""
PROMPT = PromptTemplate(
template=prompt_template, input_variables=["context", "question"]
)
chain = RetrievalQA.from_chain_type(llm=llm,
chain_type="stuff",
retriever=retriever,
input_key="query",
return_source_documents=True,
chain_type_kwargs={"prompt": PROMPT})
return chain
if __name__ == "__main__":
create_vector_db()
chain = get_qa_chain()