# rag/rag_class.py
from langchain_community.vectorstores import Chroma, FAISS
from langchain_community.llms import Ollama
from langchain_core.output_parsers import StrOutputParser
from langchain_community.embeddings import OllamaEmbeddings
from langchain_core.runnables import RunnablePassthrough
from operator import itemgetter
from langchain.prompts import ChatPromptTemplate
from rerank_code import rerank_topn
from Config.config import VECTOR_DB, DB_directory
from langchain_elasticsearch.vectorstores import ElasticsearchStore
class RAG_class:
    """RAG helper built on Ollama models and a Chroma / FAISS / Elasticsearch vector store."""

    def __init__(self, model="qwen2:7b", embed="milkey/dmeta-embedding-zh:f16", c_name="sss1",
                 persist_directory="E:/pycode/jupyter_code/langGraph/sss2/chroma.sqlite3/", es_url="http://localhost:9200"):
template = """
根据上下文回答以下问题,不要自己发挥,要根据以下参考内容总结答案,如果以下内容无法得到答案,就返回无法根据参考内容获取答案,
参考内容为:{context}
问题: {question}
"""
self.prompts = ChatPromptTemplate.from_template(template)
        # Question-decomposition prompt: expand the input question into several
        # sub-questions, then answer them recursively to build the final answer.
        template1 = """你是一个乐于助人的助手,可以生成与输入问题相关的多个子问题。
        目标是将输入分解为一组可以单独回答的子问题/子问题。
        生成多个与以下内容相关的搜索查询:{question}
        输出4个相关问题,以换行符隔开:"""
        self.prompt_questions = ChatPromptTemplate.from_template(template1)
        # Q&A-pair prompt: answer the current question using both the retrieved
        # context and the previously accumulated question/answer pairs.
        template2 = """
        以下是您需要回答的问题:
        \n--\n {question} \n---\n
        以下是任何可用的背景问答对:
        \n--\n {q_a_pairs} \n---\n
        以下是与该问题相关的其他上下文:
        \n--\n {context} \n---\n
        使用以上上下文和背景问答对来回答问题,问题是:{question} ,答案是:
        """
        self.decomposition_prompt = ChatPromptTemplate.from_template(template2)
        self.llm = Ollama(model=model)
        self.embedding = OllamaEmbeddings(model=embed)
        # Load the configured vector store (1 = Chroma, 2 = FAISS, 3 = Elasticsearch);
        # skipped gracefully when only the LLM is needed and no store is available.
        try:
            if VECTOR_DB == 1:
                self.vectstore = Chroma(embedding_function=self.embedding, collection_name=c_name,
                                        persist_directory=persist_directory)
            elif VECTOR_DB == 2:
                self.vectstore = FAISS.load_local(folder_path=persist_directory + c_name, embeddings=self.embedding,
                                                  allow_dangerous_deserialization=True)
            elif VECTOR_DB == 3:
                self.vectstore = ElasticsearchStore(
                    es_url=es_url,
                    index_name=c_name,
                    embedding=self.embedding
                )
            self.retriever = self.vectstore.as_retriever()
        except Exception as e:
            print("No vector store loaded (model-only mode):", e)
    # Post-processing: join the retrieved documents into a single context string
    def format_docs(self, docs):
        return "\n\n".join(doc.page_content for doc in docs)
    # Plain retrieval: recall with the single question, then let the LLM summarize the answer
    def simple_chain(self, question):
        _chain = (
            {"context": self.retriever | self.format_docs, "question": RunnablePassthrough()}
            | self.prompts
            | self.llm
            | StrOutputParser()
        )
        # Invoke with the bare question string so both the retriever and the
        # passthrough receive the query text itself.
        answer = _chain.invoke(question)
        return answer
    # Rerank retrieval: recall the top-10 candidates, rerank them down to the top 5, then answer
    def rerank_chain(self, question):
        retriever = self.vectstore.as_retriever(search_kwargs={"k": 10})
        docs = retriever.invoke(question)
        docs = rerank_topn(question, docs, N=5)
        _chain = (
            self.prompts
            | self.llm
            | StrOutputParser()
        )
        answer = _chain.invoke({"context": self.format_docs(docs), "question": question})
        return answer
    # Format a single question/answer pair as text
    def format_qa_pairs(self, question, answer):
        return f"Question: {question}\nAnswer:{answer}\n\n"
    # Generate the expanded sub-questions for the input question
    def decomposition_chain(self, question):
        _chain = (
            {"question": RunnablePassthrough()}
            | self.prompt_questions
            | self.llm
            | StrOutputParser()
            | (lambda x: [q for q in x.split("\n") if q.strip()])
        )
        # Invoke with the bare question string; the original question is kept
        # as the last element so it is always answered as well.
        questions = _chain.invoke(question) + [question]
        return questions
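    # Illustrative shape of the result (the actual sub-questions depend on the
    # model; only the final element, the original question, is guaranteed):
    #   ["sub-question 1", "sub-question 2", "sub-question 3", "sub-question 4", question]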
    # Recursive multi-question retrieval: each answer is added to the accumulated
    # Q&A pairs, which are fed back as background for the next sub-question.
    def rag_chain(self, questions):
        q_a_pairs = ""
        answer = ""
        for q in questions:
            _chain = (
                {"context": itemgetter("question") | self.retriever | self.format_docs,
                 "question": itemgetter("question"),
                 "q_a_pairs": itemgetter("q_a_pairs")
                 }
                | self.decomposition_prompt
                | self.llm
                | StrOutputParser()
            )
            answer = _chain.invoke({"question": q, "q_a_pairs": q_a_pairs})
            # Append the new pair instead of overwriting the accumulated history
            q_a_pairs = q_a_pairs + "\n----\n" + self.format_qa_pairs(q, answer)
        return answer
    # Format the chat history into a single string
    def format_chat_history(self, history):
        formatted_history = ""
        for role, content in history:
            formatted_history += f"{role}: {content}\n"
        return formatted_history
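    # Expected history format (an illustration; the role strings are free-form
    # and are not validated anywhere in this class):
    #   [("user", "Hello"), ("assistant", "Hi, how can I help?"), ("user", "...")]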
    # Multi-turn chat with the Ollama LLM only, without using the knowledge base
    def mult_chat(self, chat_history):
        # Format the chat history
        formatted_history = self.format_chat_history(chat_history)
        # Call the model to generate a reply
        response = self.llm.invoke(formatted_history)
        return response
# if __name__ == "__main__":
# rag = RAG_class(model="deepseek-r1:14b")
# question = "人卫社官网网址是?"
# questions = rag.decomposition_chain(question)
# print(questions)
# answer = rag.rag_chain(questions)
# print(answer)
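
# A minimal usage sketch for the remaining chains (an illustration, not part of
# the original example above): it assumes a local Ollama server with the default
# models pulled, and a vector store already built under the configured
# path/collection; the question string reuses the example from the comment above.
if __name__ == "__main__":
    rag = RAG_class(model="qwen2:7b", c_name="sss1")
    question = "人卫社官网网址是?"
    # Single-pass retrieval + answer
    print(rag.simple_chain(question))
    # Retrieve top-10 candidates, rerank to top-5, then answer
    print(rag.rerank_chain(question))
    # Multi-turn chat that does not touch the knowledge base
    history = [("user", "Hello"), ("assistant", "Hi, how can I help?"), ("user", "Tell me about yourself")]
    print(rag.mult_chat(history))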