|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from langchain_classic.chains.combine_documents import create_stuff_documents_chain
|
|
|
|
|
from langchain_classic.chains.history_aware_retriever import create_history_aware_retriever
|
|
|
|
|
from langchain_classic.chains.retrieval import create_retrieval_chain
|
|
|
|
|
from langchain_community.docstore import InMemoryDocstore
|
|
|
|
|
from langchain_community.vectorstores import FAISS
|
|
|
|
|
from langchain_core.chat_history import InMemoryChatMessageHistory
|
|
|
|
|
from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
|
|
|
|
|
from langchain_core.runnables import RunnableWithMessageHistory
|
|
|
|
|
from langchain_huggingface import HuggingFaceEmbeddings
|
|
|
|
|
import faiss;
|
|
|
|
|
import bs4;
|
|
|
|
|
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
|
|
|
|
from langchain_core.documents import Document
|
|
|
|
|
from langchain_openai import ChatOpenAI
|
|
|
|
|
from openai.types import vector_store
|
|
|
|
|
|
|
|
|
|
from env_util import DASHSCOPE_API_KEY, DASHSCOPE_BASE_URL
|
|
|
|
|
|
|
|
|
|
# 0. LLM: Qwen served through DashScope's OpenAI-compatible endpoint.
llm = ChatOpenAI(
    model="qwen-plus",
    base_url=DASHSCOPE_BASE_URL,
    api_key=DASHSCOPE_API_KEY,
    temperature=0.8,  # fairly creative; lower this for more deterministic answers
)
|
|
|
|
|
|
|
|
|
|
# Embedding model configuration.
model_name = "BAAI/bge-small-zh-v1.5"           # HuggingFace model id
model_kwargs = {'device': 'cpu'}                # use 'cuda' if an NVIDIA GPU is available
encode_kwargs = {'normalize_embeddings': True}  # normalized vectors -> dot product == cosine similarity

# On first run the model is downloaded from HuggingFace into the default HF cache directory.
hf_embedding = HuggingFaceEmbeddings(
    model_name=model_name,
    model_kwargs=model_kwargs,
    encode_kwargs=encode_kwargs,
)
|
|
|
|
|
|
|
|
|
|
# 1. ====================== Initialize the vector store ======================
# Probe the embedding model once to learn the vector dimensionality,
# then build a flat L2 (exact-search) FAISS index of that size.
index = faiss.IndexFlatL2(len(hf_embedding.embed_query('Hello world!')))

db = FAISS(
    # embedding model used to vectorize documents and queries
    embedding_function=hf_embedding,
    # FAISS index holding the raw vectors
    index=index,
    # in-memory key/value store for the Document payloads
    docstore=InMemoryDocstore(),
    # mapping from FAISS vector position -> docstore id (starts empty)
    index_to_docstore_id={},
)
|
|
|
|
|
|
|
|
|
|
# 2、======================初始化数据,填充到数据库======================
|
|
|
|
|
# 获取数据,截取后,把数据扔到paiss里
|
|
|
|
|
def create_dense_db():
    """Ingest the locally saved Agent blog page into the FAISS vector store.

    Reads ``./agent_blog.html`` (a saved copy of Lilian Weng's agent post,
    used because the live GitHub Pages site may be unreachable), extracts
    the article text, splits it into overlapping chunks, embeds them, and
    persists the store.

    Side effects: mutates the module-level ``db`` and writes the index to
    ``./faiss_db`` on disk. Returns None.
    """
    file_path = "./agent_blog.html"
    with open(file_path, 'r', encoding='utf-8') as f:
        html_content = f.read()
        print("✅ 文件读取成功 (UTF-8)。")

    # Parse only the article body/title/header; everything else is page chrome.
    soup = bs4.BeautifulSoup(
        html_content,
        "html.parser",
        parse_only=bs4.SoupStrainer(class_=("post-content", "post-title", "post-header"))
    )

    # Flatten the selected nodes to plain text, one line per element.
    text_content = soup.get_text(separator="\n", strip=True)
    temp_doc = Document(page_content=text_content)

    # Split into 1000-char chunks with 200-char overlap so context is
    # preserved across chunk boundaries.
    text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
    splits = text_splitter.split_documents([temp_doc])

    # Stable, human-readable ids: id1, id2, ...
    ids = ['id' + str(i + 1) for i in range(len(splits))]

    # Write the chunks into the vector store, then persist it to disk.
    db.add_documents(splits, ids=ids)
    db.save_local('./faiss_db')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Ingest the scraped data into the vector database (run once, then comment out).
# create_dense_db()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# 3. ================ Question contextualization ==============================
# System prompt: rewrite a history-dependent question into a standalone one.
contextualize_q_system_prompt = (
    "给定聊天历史和最新的用户问题(可能引用聊天历史中的上下文),"
    "将其重新表述为一个独立的问题(不需要聊天历史也能理解)。"
    "不要回答问题,只需在需要时重新表述问题,否则保持原样。"
)

# 4. ================= Build the chat prompt template ====================
contextualize_q_prompt = ChatPromptTemplate.from_messages([
    ("system", contextualize_q_system_prompt),  # system-role instruction
    MessagesPlaceholder("chat_history"),        # slot for prior messages
    ("human", "{input}"),                       # the user's latest question
])
|
|
|
|
|
|
|
|
|
|
# Vector-store retriever: return the 2 nearest chunks per query.
retriever = db.as_retriever(search_kwargs={'k': 2})

# Context-aware retriever: the question is first reformulated against the
# chat history (via contextualize_q_prompt) before hitting the vector store.
history_aware_retriever = create_history_aware_retriever(llm, retriever, contextualize_q_prompt)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# RAG answering stage.

### Answer the question ###
# System prompt: ground the answer in the retrieved context, stay short.
system_prompt = (
    "你是一个问答任务助手。"
    "使用以下检索到的上下文来回答问题。"
    "如果不知道答案,就说你不知道。"
    "回答最多三句话,保持简洁。"
    "\n\n"
    "{context}"  # retrieved documents are injected here
)

# Build the question-answering prompt template.
qa_prompt = ChatPromptTemplate.from_messages([
    ("system", system_prompt),            # system-role instruction
    MessagesPlaceholder("chat_history"),  # slot for prior messages
    ("human", "{input}"),                 # the user's question
])
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Chain that stuffs the retrieved docs into {context} and queries the LLM.
question_chain = create_stuff_documents_chain(llm, qa_prompt)

# Full RAG chain: history-aware retrieval -> answer generation.
rag_chain = create_retrieval_chain(history_aware_retriever, question_chain)
|
|
|
|
|
|
|
|
|
|
# In-memory chat histories, keyed by session_id.
store = {}


def get_session_history(session_id: str):
    """Return the message history for *session_id*, creating it on first use."""
    history = store.get(session_id)
    if history is None:
        history = InMemoryChatMessageHistory()
        store[session_id] = history
    return history
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Wrap the RAG chain so each invocation reads/writes per-session history.
conversational_rag_chain = RunnableWithMessageHistory(
    rag_chain,
    get_session_history,
    input_messages_key='input',           # where the user question lives
    history_messages_key='chat_history',  # where history is injected
    output_messages_key='answer',         # which output field gets recorded
)
|
|
|
|
|
|
|
|
|
|
# Demo: two related questions in one session. The second question relies on
# the first via the chat history shared under session id "abc123".
resp1 = conversational_rag_chain.invoke(
    {"input": "What is Task Decomposition?"},
    config={
        "configurable": {"session_id": "abc123"}  # keep history under "abc123"
    }
)
print(resp1['answer'])

# Follow-up ("doing it" refers back to task decomposition).
resp2 = conversational_rag_chain.invoke(
    {"input": "What are common ways of doing it?"},
    config={
        "configurable": {"session_id": "abc123"}  # same session -> same history
    }
)
print(resp2['answer'])
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|