janakiramm/langchain_gemini_qa.py

## langchain_gemini_qa.py
### Install required modules and set the envvar for Gemini API Key
#pip install pypdf2
#pip install chromadb
#pip install google.generativeai
#pip install langchain-google-genai
#pip install langchain
#pip install langchain_community
#pip install jupyter

#export GOOGLE_API_KEY="YOUR_GOOGLE_API_KEY"

#Import Python modules
from langchain_google_genai import ChatGoogleGenerativeAI
from langchain_google_genai import GoogleGenerativeAIEmbeddings
from langchain.prompts import PromptTemplate
from langchain_community.document_loaders import PyPDFLoader
from langchain_text_splitters import CharacterTextSplitter
from langchain.chains.combine_documents import create_stuff_documents_chain
from langchain.chains import create_retrieval_chain
from langchain.vectorstores import Chroma

#Load the models
llm = ChatGoogleGenerativeAI(model="gemini-pro")
embeddings = GoogleGenerativeAIEmbeddings(model="models/embedding-001")

#Load the PDF and create chunks
loader = PyPDFLoader("handbook.pdf")
text_splitter = CharacterTextSplitter(
    separator=".",
    chunk_size=250,
    chunk_overlap=50,
    length_function=len,
    is_separator_regex=False,
)
pages = loader.load_and_split(text_splitter)

#Turn the chunks into embeddings and store them in Chroma
vectordb=Chroma.from_documents(pages,embeddings)

#Configure Chroma as a retriever with top_k=5
retriever = vectordb.as_retriever(search_kwargs={"k": 5})

#Create the retrieval chain
template = """
You are a helpful AI assistant.
Answer based on the context provided.
context: {context}
input: {input}
answer:
"""
prompt = PromptTemplate.from_template(template)
combine_docs_chain = create_stuff_documents_chain(llm, prompt)
retrieval_chain = create_retrieval_chain(retriever, combine_docs_chain)

#Invoke the retrieval chain
response=retrieval_chain.invoke({"input":"How do I apply for personal leave?"})

#Print the answer to the question
print(response["answer"])
	### Install required modules and set the envvar for Gemini API Key
	#pip install pypdf2
	#pip install chromadb
	#pip install google.generativeai
	#pip install langchain-google-genai
	#pip install langchain
	#pip install langchain_community
	#pip install jupyter

	#export GOOGLE_API_KEY="YOUR_GOOGLE_API_KEY"

	#Import Python modules
	from langchain_google_genai import ChatGoogleGenerativeAI
	from langchain_google_genai import GoogleGenerativeAIEmbeddings
	from langchain.prompts import PromptTemplate
	from langchain_community.document_loaders import PyPDFLoader
	from langchain_text_splitters import CharacterTextSplitter
	from langchain.chains.combine_documents import create_stuff_documents_chain
	from langchain.chains import create_retrieval_chain
	from langchain.vectorstores import Chroma

	#Load the models
	llm = ChatGoogleGenerativeAI(model="gemini-pro")
	embeddings = GoogleGenerativeAIEmbeddings(model="models/embedding-001")

	#Load the PDF and create chunks
	loader = PyPDFLoader("handbook.pdf")
	text_splitter = CharacterTextSplitter(
	separator=".",
	chunk_size=250,
	chunk_overlap=50,
	length_function=len,
	is_separator_regex=False,
	)
	pages = loader.load_and_split(text_splitter)

	#Turn the chunks into embeddings and store them in Chroma
	vectordb=Chroma.from_documents(pages,embeddings)

	#Configure Chroma as a retriever with top_k=5
	retriever = vectordb.as_retriever(search_kwargs={"k": 5})

	#Create the retrieval chain
	template = """
	You are a helpful AI assistant.
	Answer based on the context provided.
	context: {context}
	input: {input}
	answer:
	"""
	prompt = PromptTemplate.from_template(template)
	combine_docs_chain = create_stuff_documents_chain(llm, prompt)
	retrieval_chain = create_retrieval_chain(retriever, combine_docs_chain)

	#Invoke the retrieval chain
	response=retrieval_chain.invoke({"input":"How do I apply for personal leave?"})

	#Print the answer to the question
	print(response["answer"])