Langchain-Chatchat/models/chatglm_llm.py

from abc import ABC
from typing import Optional, List

import transformers
from langchain.llms.base import LLM

from models.loader import LoaderCheckPoint
from models.base import (BaseAnswer,
                         AnswerResult,
                         AnswerResultStream,
                         AnswerResultQueueSentinelTokenListenerQueue)


class ChatGLM(BaseAnswer, LLM, ABC):
    max_token: int = 10000
    temperature: float = 0.01
    top_p = 0.9
    checkPoint: LoaderCheckPoint = None
    # history = []
    history_len: int = 10

    def __init__(self, checkPoint: LoaderCheckPoint = None):
        super().__init__()
        self.checkPoint = checkPoint

    @property
    def _llm_type(self) -> str:
        return "ChatGLM"

    @property
    def _check_point(self) -> LoaderCheckPoint:
        return self.checkPoint

    @property
    def _history_len(self) -> int:
        return self.history_len

    def set_history_len(self, history_len: int = 10) -> None:
        self.history_len = history_len

    def _call(self, prompt: str, stop: Optional[List[str]] = None) -> str:
        # Generation is handled by _generate_answer below; the LangChain _call hook is unused here.
        pass

    def _generate_answer(self, prompt: str,
                         history: List[List[str]] = None,
                         streaming: bool = False,
                         generate_with_callback: AnswerResultStream = None) -> None:
        # Use None instead of a mutable default: the streaming branch appends to history in place.
        history = [] if history is None else history
        # Create the StoppingCriteriaList with the stopping strings
        stopping_criteria_list = transformers.StoppingCriteriaList()
        # Register the model's stopping_criteria listener queue: on every response step it
        # syncs the torch.LongTensor / torch.FloatTensor state into the AnswerResult.
        listenerQueue = AnswerResultQueueSentinelTokenListenerQueue()
        stopping_criteria_list.append(listenerQueue)
        if streaming:
            # Reserve a slot for the in-progress turn; each partial response overwrites it.
            history += [[]]
            for inum, (stream_resp, _) in enumerate(self.checkPoint.model.stream_chat(
                    self.checkPoint.tokenizer,
                    prompt,
                    history=history[-self.history_len:-1] if self.history_len > 0 else [],
                    max_length=self.max_token,
                    temperature=self.temperature,
                    stopping_criteria=stopping_criteria_list
            )):
                self.checkPoint.clear_torch_cache()
                history[-1] = [prompt, stream_resp]
                answer_result = AnswerResult()
                answer_result.history = history
                answer_result.llm_output = {"answer": stream_resp}
                if len(listenerQueue.listenerQueue) > 0:
                    answer_result.listenerToken = listenerQueue.listenerQueue.pop()
                generate_with_callback(answer_result)
        else:
            # Non-streaming path: a single chat() call, then one callback with the full answer.
            response, _ = self.checkPoint.model.chat(
                self.checkPoint.tokenizer,
                prompt,
                history=history[-self.history_len:] if self.history_len > 0 else [],
                max_length=self.max_token,
                temperature=self.temperature,
                stopping_criteria=stopping_criteria_list
            )
            self.checkPoint.clear_torch_cache()
            history += [[prompt, response]]
            answer_result = AnswerResult()
            answer_result.history = history
            answer_result.llm_output = {"answer": response}
            if len(listenerQueue.listenerQueue) > 0:
                answer_result.listenerToken = listenerQueue.listenerQueue.pop()
            generate_with_callback(answer_result)
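

# Hypothetical usage sketch: a minimal example of driving this class, assuming a
# LoaderCheckPoint has already been created and has loaded the ChatGLM model and
# tokenizer elsewhere in the project. The `collect` callback is an illustrative
# assumption, not part of this module; it simply gathers each AnswerResult that
# _generate_answer emits.
#
#     checkpoint = ...  # an already-loaded LoaderCheckPoint (assumed set up elsewhere)
#     llm = ChatGLM(checkPoint=checkpoint)
#     llm.set_history_len(5)
#
#     answers = []
#
#     def collect(answer_result: AnswerResult) -> None:
#         answers.append(answer_result.llm_output["answer"])
#
#     llm._generate_answer("你好", history=[], streaming=True,
#                          generate_with_callback=collect)
#     # answers[-1] holds the latest (cumulative) streamed reply.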