Langchain-Chatchat/configs/model_config.py

import torch.cuda
import torch.backends
import os

# Embedding models that can be selected, keyed by a short alias.
# NOTE(review): the values look like Hugging Face Hub repo ids - confirm
# against the code that loads them.
embedding_model_dict = {
    "ernie-tiny": "nghuyong/ernie-3.0-nano-zh",
    "ernie-base": "nghuyong/ernie-3.0-base-zh",
    "text2vec-base": "shibing624/text2vec-base-chinese",
    "text2vec": "GanymedeNil/text2vec-large-chinese",
}

# Embedding model name (one of the keys of embedding_model_dict)
EMBEDDING_MODEL = "text2vec"

# Embedding running device: prefer CUDA, then Apple MPS, then fall back to CPU.
# `torch.backends.mps` is looked up defensively because PyTorch builds that
# predate the MPS backend do not expose that attribute; an unguarded access
# would raise AttributeError while this config module is being imported.
if torch.cuda.is_available():
    EMBEDDING_DEVICE = "cuda"
elif (
    getattr(torch.backends, "mps", None) is not None
    and torch.backends.mps.is_available()
):
    EMBEDDING_DEVICE = "mps"
else:
    EMBEDDING_DEVICE = "cpu"

# Supported LLM models, keyed by a short alias.
# NOTE(review): the values look like Hugging Face Hub repo ids - confirm
# against the code that loads them.
llm_model_dict = {
    "chatyuan": "ClueAI/ChatYuan-large-v2",
    "chatglm-6b-int4-qe": "THUDM/chatglm-6b-int4-qe",
    "chatglm-6b-int4": "THUDM/chatglm-6b-int4",
    "chatglm-6b-int8": "THUDM/chatglm-6b-int8",
    "chatglm-6b": "THUDM/chatglm-6b",
}

# LLM model name (one of the keys of llm_model_dict)
LLM_MODEL = "chatglm-6b"

# LLM streaming response
STREAMING = True

# Use p-tuning-v2 PrefixEncoder
USE_PTUNING_V2 = False

# LLM running device: prefer CUDA, then Apple MPS, then fall back to CPU.
# `torch.backends.mps` is looked up defensively because PyTorch builds that
# predate the MPS backend do not expose that attribute; an unguarded access
# would raise AttributeError while this config module is being imported.
if torch.cuda.is_available():
    LLM_DEVICE = "cuda"
elif (
    getattr(torch.backends, "mps", None) is not None
    and torch.backends.mps.is_available()
):
    LLM_DEVICE = "mps"
else:
    LLM_DEVICE = "cpu"

# Project root = parent of the directory containing this file.
# `__file__` is made absolute first: it can be a relative path (e.g. when the
# file is executed directly on older interpreters), in which case the derived
# directories would silently depend on the current working directory.
_PROJECT_ROOT = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))

# "vector_store" directory under the project root.
# NOTE(review): presumably where vector stores are persisted - confirm with callers.
VS_ROOT_PATH = os.path.join(_PROJECT_ROOT, "vector_store")

# "content" directory under the project root.
# NOTE(review): presumably where uploaded files are kept - confirm with callers.
UPLOAD_ROOT_PATH = os.path.join(_PROJECT_ROOT, "content")

# "api_content" directory under the project root.
# NOTE(review): presumably the upload directory used by the API - confirm with callers.
API_UPLOAD_ROOT_PATH = os.path.join(_PROJECT_ROOT, "api_content")

# Context-based prompt template. Be sure to keep the "{question}" and
# "{context}" placeholders.
# Written as adjacent string literals with explicit newlines so that the
# exact whitespace (including the space after "{context}") is visible.
PROMPT_TEMPLATE = (
    "已知信息：\n"
    "{context} \n"
    "\n"
    "根据上述已知信息，简洁和专业的来回答用户的问题。如果无法从中得到答案，请说 “根据已知信息无法回答该问题” 或 “没有提供足够的相关信息”，不允许在答案中添加编造成分，答案请使用中文。 问题是：{question}"
)

# Length of a single context passage after matching
CHUNK_SIZE = 250

# LLM input history length
LLM_HISTORY_LEN = 3

# Return top-k text chunks from the vector store
VECTOR_SEARCH_TOP_K = 5

# "nltk_data" directory located next to this file.
# `__file__` is made absolute first: it can be a relative path (e.g. when the
# file is executed directly on older interpreters), which would otherwise make
# this location depend on the current working directory.
NLTK_DATA_PATH = os.path.join(os.path.dirname(os.path.abspath(__file__)), "nltk_data")
-												修改项目架构

											
										
										
											2023-04-13 23:01:52 +08:00
+								import torch.cuda
 								import torch.backends
-												update model_config.py

											
										
										
											2023-04-25 20:14:33 +08:00
+								import os
-												修改项目架构

											
										
										
											2023-04-13 23:01:52 +08:00
 								embedding_model_dict = {
 								    "ernie-tiny": "nghuyong/ernie-3.0-nano-zh",
 								    "ernie-base": "nghuyong/ernie-3.0-base-zh",
-												update model_config.py

											
										
										
											2023-04-27 07:40:57 +08:00
+								    "text2vec-base": "shibing624/text2vec-base-chinese",
-												修改项目架构

											
										
										
											2023-04-13 23:01:52 +08:00
+								    "text2vec": "GanymedeNil/text2vec-large-chinese",
 								}
 								# Embedding model name
-												update cli_demo.py

											
										
										
											2023-04-13 23:20:45 +08:00
+								EMBEDDING_MODEL = "text2vec"
-												修改项目架构

											
										
										
											2023-04-13 23:01:52 +08:00
 								# Embedding running device
 								EMBEDDING_DEVICE = "cuda" if torch.cuda.is_available() else "mps" if torch.backends.mps.is_available() else "cpu"
 								# supported LLM models
 								llm_model_dict = {
-												update model_config.py

											
										
										
											2023-04-27 07:40:57 +08:00
+								    "chatyuan": "ClueAI/ChatYuan-large-v2",
-												修改项目架构

											
										
										
											2023-04-13 23:01:52 +08:00
+								    "chatglm-6b-int4-qe": "THUDM/chatglm-6b-int4-qe",
 								    "chatglm-6b-int4": "THUDM/chatglm-6b-int4",
-												add llm model and embedding model options in model_config.py

											
										
										
											2023-04-27 07:48:43 +08:00
+								    "chatglm-6b-int8": "THUDM/chatglm-6b-int8",
-												修改项目架构

											
										
										
											2023-04-13 23:01:52 +08:00
+								    "chatglm-6b": "THUDM/chatglm-6b",
 								}
 								# LLM model name
-												Update model_config.py
											
										
										
											2023-04-21 21:22:25 +08:00
+								LLM_MODEL = "chatglm-6b"
-												修改项目架构

											
										
										
											2023-04-13 23:01:52 +08:00
-												add streaming option in configs/model_config.py

											
										
										
											2023-05-01 17:50:16 +08:00
+								# LLM streaming reponse
 								STREAMING = True
-												Support p-tuning-v2

											
										
										
											2023-04-15 14:43:12 +08:00
+								# Use p-tuning-v2 PrefixEncoder
 								USE_PTUNING_V2 = False
-												修改项目架构

											
										
										
											2023-04-13 23:01:52 +08:00
+								# LLM running device
 								LLM_DEVICE = "cuda" if torch.cuda.is_available() else "mps" if torch.backends.mps.is_available() else "cpu"
-												add api.py

											
										
										
											2023-05-03 22:31:28 +08:00
+								VS_ROOT_PATH = os.path.join(os.path.dirname(os.path.dirname(__file__)), "vector_store")
-												update project to v0.1.3

											
										
										
											2023-04-19 23:02:47 +08:00
-												add api.py

											
										
										
											2023-05-03 22:31:28 +08:00
+								UPLOAD_ROOT_PATH = os.path.join(os.path.dirname(os.path.dirname(__file__)), "content")
-												update project to v0.1.3

											
										
										
											2023-04-19 23:02:47 +08:00
-												Use fastapi to implement API (#209)

* Use fastapi to implement API

* Update model_config.py

---------

Co-authored-by: imClumsyPanda <littlepanda0716@gmail.com>
											
										
										
											2023-05-03 21:29:28 +08:00
+								API_UPLOAD_ROOT_PATH = os.path.join(os.path.dirname(os.path.dirname(__file__)), "api_content")
-												update model_config.py

											
										
										
											2023-04-26 23:20:08 +08:00
+								# 基于上下文的prompt模版，请务必保留"{question}"和"{context}"
-												update PROMPT_TEMPLATE

											
										
										
											2023-05-02 00:28:09 +08:00
+								PROMPT_TEMPLATE = """已知信息：
-												Dev (#214)

* github: Add issue templates

* supports GPU usage in docker (#197)

* 上下文的prompt模版内容修改

---------

Co-authored-by: Calcitem <calcitem@outlook.com>
Co-authored-by: cocomany <124849750+cocomany@users.noreply.github.com>
Co-authored-by: glide-the <2533736852@qq.com>
											
										
										
											2023-05-01 23:55:37 +08:00
+								{context}
-												update PROMPT_TEMPLATE

											
										
										
											2023-05-02 00:28:09 +08:00
+								根据上述已知信息，简洁和专业的来回答用户的问题。如果无法从中得到答案，请说 “根据已知信息无法回答该问题” 或 “没有提供足够的相关信息”，不允许在答案中添加编造成分，答案请使用中文。 问题是：{question}"""
-												update text_splitter

											
										
										
											2023-04-28 00:02:42 +08:00
 								# 匹配后单段上下文长度
-												update torch_gc

											
										
										
											2023-05-04 20:48:36 +08:00
+								CHUNK_SIZE = 250
 								# LLM input history length
 								LLM_HISTORY_LEN = 3
 								# return top-k text chunk from vector store
 								VECTOR_SEARCH_TOP_K = 5
 								NLTK_DATA_PATH = os.path.join(os.path.dirname(__file__), "nltk_data")