GLM3支持传入提示词 (#2058)

支持传入提示词的Agent ChatGLM3-6B
2023-11-14 17:45:22 +08:00 · 2023-11-14 17:45:22 +08:00 · 21b079d751
parent e78a804ec6
commit 21b079d751
5 changed files with 155 additions and 160 deletions
--- a/configs/prompt_config.py.example
+++ b/configs/prompt_config.py.example
@ -17,96 +17,118 @@
 #   - input: 用户输入内容
 #   - agent_scratchpad: Agent的思维记录
-PROMPT_TEMPLATES = {
+PROMPT_TEMPLATES = {}
    "completion": {
        "default": "{input}"
    },
-    "llm_chat": {
+PROMPT_TEMPLATES["llm_chat"] = {
-        "default": "{{ input }}",
+"default": "{{ input }}",
-
+"py":
-        "py":
+"""
-            """
+你是一个聪明的代码助手，请你给我写出简单的py代码。 \n
-        你是一个聪明的代码助手，请你给我写出简单的py代码。 \n
+{{ input }}
-        {{ input }}
+""",
-        """
+}
-        ,
+
-    },
+PROMPT_TEMPLATES["knowledge_base_chat"] = {
-
+"default":
-    "knowledge_base_chat": {
+"""
-        "default":
+<指令>根据已知信息，简洁和专业的来回答问题。如果无法从中得到答案，请说 “根据已知信息无法回答该问题”，不允许在答案中添加编造成分，答案请使用中文。 </指令>
-            """
+<已知信息>{{ context }}</已知信息>、
-        <指令>根据已知信息，简洁和专业的来回答问题。如果无法从中得到答案，请说 “根据已知信息无法回答该问题”，不允许在答案中添加编造成分，答案请使用中文。 </指令>
+<问题>{{ question }}</问题>
-        <已知信息>{{ context }}</已知信息>、
+""",
-        <问题>{{ question }}</问题>
+"text":
-        """,
+"""
-        "text":
+<指令>根据已知信息，简洁和专业的来回答问题。如果无法从中得到答案，请说 “根据已知信息无法回答该问题”，答案请使用中文。 </指令>
-            """
+<已知信息>{{ context }}</已知信息>、
-        <指令>根据已知信息，简洁和专业的来回答问题。如果无法从中得到答案，请说 “根据已知信息无法回答该问题”，答案请使用中文。 </指令>
+<问题>{{ question }}</问题>
-        <已知信息>{{ context }}</已知信息>、
+""",
-        <问题>{{ question }}</问题>
+"Empty":  # 搜不到知识库的时候使用
-        """,
+"""
-        "Empty":  # 搜不到内容的时候调用，此时没有已知信息，这个Empty可以更改，但不能删除，会影响程序使用
+请你回答我的问题:
-            """
+{{ question }}
-        <指令>请根据用户的问题，进行简洁明了的回答</指令>
+\n
-        <问题>{{ question }}</问题>
+""",
-        """,
+}
-    },
+PROMPT_TEMPLATES["search_engine_chat"] = {
-
+"default":
-    "search_engine_chat": {
+"""
-        "default":
+<指令>这是我搜索到的互联网信息，请你根据这些信息进行提取并有调理，简洁的回答问题。如果无法从中得到答案，请说 “无法搜索到能回答问题的内容”。 </指令>
-            """
+<已知信息>{{ context }}</已知信息>
-            <指令>这是我搜索到的互联网信息，请你根据这些信息进行提取并有调理，简洁的回答问题。如果无法从中得到答案，请说 “无法搜索到能回答问题的内容”。 </指令>
+<问题>{{ question }}</问题>
-            <已知信息>{{ context }}</已知信息>、
+""",
-            <问题>{{ question }}</问题>
+"search":
-            """,
+"""
-        "search":
+<指令>根据已知信息，简洁和专业的来回答问题。如果无法从中得到答案，请说 “根据已知信息无法回答该问题”，答案请使用中文。 </指令>
-            """
+<已知信息>{{ context }}</已知信息>、
-        <指令>根据已知信息，简洁和专业的来回答问题。如果无法从中得到答案，请说 “根据已知信息无法回答该问题”，答案请使用中文。 </指令>
+<问题>{{ question }}</问题>
-        <已知信息>{{ context }}</已知信息>、
+""",
-        <问题>{{ question }}</问题>
+}
-        """,
+PROMPT_TEMPLATES["agent_chat"] = {
-        "Empty":  # 搜不到内容的时候调用，此时没有已知信息，这个Empty可以更改，但不能删除，会影响程序使用
+"default":
-            """
+"""
-        <指令>请根据用户的问题，进行简洁明了的回答</指令>
+Answer the following questions as best you can. If it is in order, you can use some tools appropriately.You have access to the following tools:
-        <问题>{{ question }}</问题>
+
-        """,
+{tools}
-    },
+
-
+Please note that the "知识库查询工具" is information about the "西交利物浦大学" ,and if a question is asked about it, you must answer with the knowledge base，
-    "agent_chat": {
+Please note that the "天气查询工具" can only be used once since Question begin.
-        "default":
+
-            """
+Use the following format:
-        Answer the following questions as best you can. If it is in order, you can use some tools appropriately.You have access to the following tools:
+Question: the input question you must answer1
-
+Thought: you should always think about what to do and what tools to use.
-        {tools}
+Action: the action to take, should be one of [{tool_names}]
-
+Action Input: the input to the action
-        Please note that the "知识库查询工具" is information about the "西交利物浦大学" ,and if a question is asked about it, you must answer with the knowledge base，
+Observation: the result of the action
-        Please note that the "天气查询工具" can only be used once since Question begin.
+... (this Thought/Action/Action Input/Observation can be repeated zero or more times)
-
+Thought: I now know the final answer
-        Use the following format:
+Final Answer: the final answer to the original input question
-        Question: the input question you must answer1
+Begin!
-        Thought: you should always think about what to do and what tools to use.
+
-        Action: the action to take, should be one of [{tool_names}]
+history: {history}
-        Action Input: the input to the action
+
-        Observation: the result of the action
+Question: {input}
-        ... (this Thought/Action/Action Input/Observation can be repeated zero or more times)
+
-        Thought: I now know the final answer
+Thought: {agent_scratchpad}
-        Final Answer: the final answer to the original input question
+""",
-
+
-
+"ChatGLM3":
-        Begin!
+"""
-        history:
+You can answer using the tools, or answer directly using your knowledge without using the tools.Respond to the human as helpfully and accurately as possible.
-        {history}
+You have access to the following tools:
-        Question: {input}
+{tools}
-        Thought: {agent_scratchpad}
+Use a json blob to specify a tool by providing an action key (tool name) and an action_input key (tool input).
-        """,
+Valid "action" values: "Final Answer" or  [{tool_names}]
-
+Provide only ONE action per $JSON_BLOB, as shown:
-        "ChatGLM3":   # ChatGLM3必须用官方的提示词，没有修改空间，目前参数都不会传入进去
+
-        """
+```
-        history:
+{{{{
-        {history}
+  "action": $TOOL_NAME,
-        Question: {input}
+  "action_input": $INPUT
-        Thought: {agent_scratchpad}
+}}}}
-        """,
+```
-    },
+
 Follow this format:
 Question: input question to answer
 Thought: consider previous and subsequent steps
 Action:
 ```
 $JSON_BLOB
 ```
 Observation: action result
 ... (repeat Thought/Action/Observation N times)
 Thought: I know what to respond
 Action:
 ```
 {{{{
  "action": "Final Answer",
  "action_input": "Final response to human"
 }}}}
 Begin! Reminder to ALWAYS respond with a valid json blob of a single action. Use tools if necessary. Respond directly if appropriate. Format is Action:```$JSON_BLOB```then Observation:.
 history: {history}
 Question: {input}
 Thought: {agent_scratchpad}
 """,
 }
--- a/server/agent/custom_agent/ChatGLM3Agent.py
+++ b/server/agent/custom_agent/ChatGLM3Agent.py
@ -1,11 +1,11 @@
 """
 This file is a modified version of the original ChatGLM3Agent.py file from the langchain repo, adapted for ChatGLM3-6B.
 """
 from __future__ import annotations
 import yaml
 from langchain.agents.structured_chat.output_parser import StructuredChatOutputParser
 from langchain.memory import ConversationBufferWindowMemory
 from typing import Any, List, Sequence, Tuple, Optional, Union
 import os
 from langchain.agents.agent import Agent
@ -13,7 +13,7 @@ from langchain.chains.llm import LLMChain
 from langchain.prompts.chat import (
    ChatPromptTemplate,
    HumanMessagePromptTemplate,
-    SystemMessagePromptTemplate,
+    SystemMessagePromptTemplate, MessagesPlaceholder,
 )
 import json
 import logging
@ -26,45 +26,6 @@ from langchain.callbacks.base import BaseCallbackManager
 from langchain.schema.language_model import BaseLanguageModel
 from langchain.tools.base import BaseTool
 PREFIX = """
 You can answer using the tools, or answer directly using your knowledge without using the tools.
 Respond to the human as helpfully and accurately as possible.
 You have access to the following tools:
 """
 FORMAT_INSTRUCTIONS = """Use a json blob to specify a tool by providing an action key (tool name) and an action_input key (tool input).
 Valid "action" values: "Final Answer" or {tool_names}
 Provide only ONE action per $JSON_BLOB, as shown:
 ```
 {{{{
  "action": $TOOL_NAME,
  "action_input": $INPUT
 }}}}
 ```
 Follow this format:
 Question: input question to answer
 Thought: consider previous and subsequent steps
 Action:
 ```
 $JSON_BLOB
 ```
 Observation: action result
 ... (repeat Thought/Action/Observation N times)
 Thought: I know what to respond
 Action:
 ```
 {{{{
  "action": "Final Answer",
  "action_input": "Final response to human"
 }}}}
 ```"""
 SUFFIX = """Begin! Reminder to ALWAYS respond with a valid json blob of a single action. Use tools if necessary. Respond directly if appropriate. Format is Action:```$JSON_BLOB```then Observation:.
 Thought:"""
 HUMAN_MESSAGE_TEMPLATE = "{input}\n\n{agent_scratchpad}"
 logger = logging.getLogger(__name__)
@ -77,9 +38,6 @@ class StructuredChatOutputParserWithRetries(AgentOutputParser):
    output_fixing_parser: Optional[OutputFixingParser] = None
    """The output fixing parser to use."""
    def get_format_instructions(self) -> str:
        return FORMAT_INSTRUCTIONS
    def parse(self, text: str) -> Union[AgentAction, AgentFinish]:
        special_tokens = ["Action:", "<|observation|>"]
        first_index = min([text.find(token) if token in text else len(text) for token in special_tokens])
@ -112,6 +70,7 @@ Action:
            return parsed_obj
        except Exception as e:
            raise OutputParserException(f"Could not parse LLM output: {text}") from e
    @property
    def _type(self) -> str:
        return "structured_chat_ChatGLM3_6b_with_retries"
@ -168,47 +127,57 @@ class StructuredGLM3ChatAgent(Agent):
    def create_prompt(
            cls,
            tools: Sequence[BaseTool],
-            prefix: str = PREFIX,
+            prompt: str = None,
            suffix: str = SUFFIX,
            human_message_template: str = HUMAN_MESSAGE_TEMPLATE,
            format_instructions: str = FORMAT_INSTRUCTIONS,
            input_variables: Optional[List[str]] = None,
            memory_prompts: Optional[List[BasePromptTemplate]] = None,
    ) -> BasePromptTemplate:
        def tool_config_from_file(tool_name, directory="server/agent/tools/"):
-            """search tool yaml and return json format"""
+            """search tool yaml and return simplified json format"""
            file_path = os.path.join(directory, f"{tool_name.lower()}.yaml")
            try:
                with open(file_path, 'r', encoding='utf-8') as file:
-                    return yaml.safe_load(file)
+                    tool_config = yaml.safe_load(file)
                    # Simplify the structure if needed
                    simplified_config = {
                        "name": tool_config.get("name", ""),
                        "description": tool_config.get("description", ""),
                        "parameters": tool_config.get("parameters", {})
                    }
                    return simplified_config
            except FileNotFoundError:
-                print(f"File not found: {file_path}")
+                logger.error(f"File not found: {file_path}")
                return None
            except Exception as e:
-                print(f"An error occurred while reading {file_path}: {e}")
+                logger.error(f"An error occurred while reading {file_path}: {e}")
                return None
        tools_json = []
-        tool_names = ""
+        tool_names = []
        for tool in tools:
            tool_config = tool_config_from_file(tool.name)
            if tool_config:
                tools_json.append(tool_config)
-                tool_names.join(tool.name + ", ")
+                tool_names.append(tool.name)
        # Format the tools for output
        formatted_tools = "\n".join([
-            json.dumps(tool, ensure_ascii=False).replace("\"", "\\\"").replace("{", "{{").replace("}", "}}")
+            f"{tool['name']}: {tool['description']}, args: {tool['parameters']}"
            for tool in tools_json
        ])
-        format_instructions = format_instructions.format(tool_names=tool_names)
+        formatted_tools = formatted_tools.replace("'", "\\'").replace("{", "{{").replace("}", "}}")
-        template = "\n\n".join([prefix, formatted_tools, format_instructions, suffix])
+
        template = prompt.format(tool_names=tool_names,
                                 tools=formatted_tools,
                                 history="{history}",
                                 input="{input}",
                                 agent_scratchpad="{agent_scratchpad}")
        if input_variables is None:
            input_variables = ["input", "agent_scratchpad"]
        _memory_prompts = memory_prompts or []
        messages = [
            SystemMessagePromptTemplate.from_template(template),
            *_memory_prompts,
            HumanMessagePromptTemplate.from_template(human_message_template),
        ]
        return ChatPromptTemplate(input_variables=input_variables, messages=messages)
@ -217,12 +186,10 @@ class StructuredGLM3ChatAgent(Agent):
            cls,
            llm: BaseLanguageModel,
            tools: Sequence[BaseTool],
            prompt: str = None,
            callback_manager: Optional[BaseCallbackManager] = None,
            output_parser: Optional[AgentOutputParser] = None,
            prefix: str = PREFIX,
            suffix: str = SUFFIX,
            human_message_template: str = HUMAN_MESSAGE_TEMPLATE,
            format_instructions: str = FORMAT_INSTRUCTIONS,
            input_variables: Optional[List[str]] = None,
            memory_prompts: Optional[List[BasePromptTemplate]] = None,
            **kwargs: Any,
@ -231,10 +198,7 @@ class StructuredGLM3ChatAgent(Agent):
        cls._validate_tools(tools)
        prompt = cls.create_prompt(
            tools,
-            prefix=prefix,
+            prompt=prompt,
            suffix=suffix,
            human_message_template=human_message_template,
            format_instructions=format_instructions,
            input_variables=input_variables,
            memory_prompts=memory_prompts,
        )
@ -260,7 +224,9 @@ class StructuredGLM3ChatAgent(Agent):
 def initialize_glm3_agent(
        tools: Sequence[BaseTool],
        llm: BaseLanguageModel,
        prompt: str = None,
        callback_manager: Optional[BaseCallbackManager] = None,
        memory: Optional[ConversationBufferWindowMemory] = None,
        agent_kwargs: Optional[dict] = None,
        *,
        tags: Optional[Sequence[str]] = None,
@ -269,12 +235,17 @@ def initialize_glm3_agent(
    tags_ = list(tags) if tags else []
    agent_kwargs = agent_kwargs or {}
    agent_obj = StructuredGLM3ChatAgent.from_llm_and_tools(
-        llm, tools, callback_manager=callback_manager, **agent_kwargs
+        llm=llm,
        tools=tools,
        prompt=prompt,
        callback_manager=callback_manager, **agent_kwargs
    )
    return AgentExecutor.from_agent_and_tools(
        agent=agent_obj,
        tools=tools,
        callback_manager=callback_manager,
        memory=memory,
        tags=tags_,
        **kwargs,
    )
--- a/server/agent/custom_template.py
+++ b/server/agent/custom_template.py
@ -21,7 +21,6 @@ class CustomPromptTemplate(StringPromptTemplate):
        kwargs["tool_names"] = ", ".join([tool.name for tool in self.tools])
        return self.template.format(**kwargs)
 class CustomOutputParser(AgentOutputParser):
    begin: bool = False
    def __init__(self):
--- a/server/chat/agent_chat.py
+++ b/server/chat/agent_chat.py
@ -91,8 +91,11 @@ async def agent_chat(query: str = Body(..., description="用户输入", examples
                llm=model,
                tools=tools,
                callback_manager=None,
-                verbose=True,
+                # The LangChain prompt is not constructed here; it is built inside the GLM3 agent.
                prompt=prompt_template,
                input_variables=["input", "intermediate_steps", "history"],
                memory=memory,
                verbose=True,
            )
        else:
            agent = LLMSingleActionAgent(
--- a/server/utils.py
+++ b/server/utils.py
@ -9,7 +9,7 @@ from configs import (LLM_MODELS, LLM_DEVICE, EMBEDDING_DEVICE,
                     FSCHAT_MODEL_WORKERS, HTTPX_DEFAULT_TIMEOUT)
 import os
 from concurrent.futures import ThreadPoolExecutor, as_completed
-from langchain.chat_models import ChatOpenAI, AzureChatOpenAI, ChatAnthropic
+from langchain.chat_models import ChatOpenAI
 from langchain.llms import OpenAI, AzureOpenAI, Anthropic
 import httpx
 from typing import Literal, Optional, Callable, Generator, Dict, Any, Awaitable, Union