# Langchain-Chatchat/configs/server_config.py.example

from configs.model_config import LLM_DEVICE
import httpx

# Default timeout for httpx requests, in seconds. If model loading or chatting is
# slow and timeout errors occur, increase this value as needed.
HTTPX_DEFAULT_TIMEOUT = 300.0

# Whether the API allows cross-domain requests. Defaults to False; set it to True
# to enable them.
OPEN_CROSS_DOMAIN = False

# Default host that each server binds to. If you change it to "0.0.0.0", the
# "host" of every XX_SERVER entry below has to be changed as well.
DEFAULT_BIND_HOST = "127.0.0.1"

# webui.py server: bind host (the shared default) and port.
WEBUI_SERVER = {
    "host": DEFAULT_BIND_HOST,
    "port": 8501,
}

# api.py server: bind host (the shared default) and port.
API_SERVER = {
    "host": DEFAULT_BIND_HOST,
    "port": 7861,
}

# fastchat openai_api server: bind host (the shared default) and port.
FSCHAT_OPENAI_API = {
    "host": DEFAULT_BIND_HOST,
    "port": 20000,
}

# fastchat model_worker server
# These models must be correctly configured in model_config.MODEL_PATH or ONLINE_MODEL.
# When launching startup.py, a model can be selected with `--model-worker --model-name xxxx`;
# if none is specified, LLM_MODEL is used.
FSCHAT_MODEL_WORKERS = {
    # Default settings shared by all models; they can be overridden in a model's own entry.
    "default": {
        "host": DEFAULT_BIND_HOST,
        "port": 20002,
        "device": LLM_DEVICE,

        # Parameters required for multi-GPU loading
        # "gpus": None, # GPUs to use, given as a str, e.g. "0,1"
        # "num_gpus": 1, # number of GPUs to use
        # "max_gpu_memory": "20GiB", # maximum memory to use on each GPU

        # The following are rarely used parameters; configure them as needed
        # "load_8bit": False, # enable 8-bit quantization
        # "cpu_offloading": None,
        # "gptq_ckpt": None,
        # "gptq_wbits": 16,
        # "gptq_groupsize": -1,
        # "gptq_act_order": False,
        # "awq_ckpt": None,
        # "awq_wbits": 16,
        # "awq_groupsize": -1,
        # NOTE(review): LLM_MODEL is not among the names imported at the top of this
        # file (only LLM_DEVICE is); import it before uncommenting the next line.
        # "model_names": [LLM_MODEL],
        # "conv_template": None,
        # "limit_worker_concurrency": 5,
        # "stream_interval": 2,
        # "no_register": False,
        # "embed_in_truncate": False,
    },
    "baichuan-7b": { # uses the IP and port from "default"
        "device": "cpu",
    },
    "zhipu-api": { # set a different port for each online API you want to run
        "port": 21001,
    },
    "minimax-api": {
        "port": 21002,
    },
    "xinghuo-api": {
        "port": 21003,
    },
    "qianfan-api": {
        "port": 21004,
    },
}

# fastchat multi model worker server
# Currently an empty placeholder; no settings are defined yet.
FSCHAT_MULTI_MODEL_WORKERS = {
    # TODO:
}

# fastchat controller server: bind host (the shared default), port and dispatch method.
# NOTE(review): "dispatch_method" is presumably forwarded to the fastchat controller;
# confirm the accepted values against the fastchat version in use.
FSCHAT_CONTROLLER = {
    "host": DEFAULT_BIND_HOST,
    "port": 20001,
    "dispatch_method": "shortest_queue",
}
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								from configs.model_config import LLM_DEVICE
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智谱AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								import httpx
 								# httpx 请求默认超时时间（秒）。如果加载模型或对话较慢，出现超时错误，可以适当加大该值。
 								HTTPX_DEFAULT_TIMEOUT = 300.0
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
 								# API 是否开启跨域，默认为False，如果需要开启，请设置为True
 								# is open cross domain
 								OPEN_CROSS_DOMAIN = False
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								# 各服务器默认绑定host。如改为"0.0.0.0"需要修改下方所有XX_SERVER的host
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
+								DEFAULT_BIND_HOST = "127.0.0.1"
 								# webui.py server
 								WEBUI_SERVER = {
 								    "host": DEFAULT_BIND_HOST,
 								    "port": 8501,
 								}
 								# api.py server
 								API_SERVER = {
 								    "host": DEFAULT_BIND_HOST,
 								    "port": 7861,
 								}
 								# fastchat openai_api server
 								FSCHAT_OPENAI_API = {
 								    "host": DEFAULT_BIND_HOST,
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								    "port": 20000,
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
+								}
 								# fastchat model_worker server
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								# 这些模型必须是在model_config.MODEL_PATH或ONLINE_MODEL中正确配置的。
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
+								# 在启动startup.py时，可用通过`--model-worker --model-name xxxx`指定模型，不指定则为LLM_MODEL
 								FSCHAT_MODEL_WORKERS = {
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								    # 所有模型共用的默认配置，可在模型专项配置中进行覆盖。
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智谱AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								    "default": {
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
+								        "host": DEFAULT_BIND_HOST,
 								        "port": 20002,
 								        "device": LLM_DEVICE,
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智谱AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
 								        # 多卡加载需要配置的参数
-												优化server_config配置项 (#1293)

* update server_config.py:
- 在model_config中增加HISTORY_LEN配置参数
- 将server_config中helper function移动到server.utils中
- 统一set_httpx_timeout的定义和调用

* update webui.py:
应用model_config中的配置项：HISTORY_LEN,VECTOR_SEARCH_TOP_K,SEARCH_ENGINE_TOP_K

---------

Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-08-29 10:06:09 +08:00
+								        # "gpus": None, # 使用的GPU，以str的格式指定，如"0,1"
 								        # "num_gpus": 1, # 使用GPU的数量
-												update server_config.py.example: 增加多卡启动的说明

											
										
										
											2023-08-25 11:27:39 +08:00
+								        # "max_gpu_memory": "20GiB", # 每个GPU占用的最大显存
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智谱AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
 								        # 以下为非常用参数，可根据需要配置
-												update server_config.py.example: 增加多卡启动的说明

											
										
										
											2023-08-25 11:27:39 +08:00
+								        # "load_8bit": False, # 开启8bit量化
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
+								        # "cpu_offloading": None,
 								        # "gptq_ckpt": None,
 								        # "gptq_wbits": 16,
 								        # "gptq_groupsize": -1,
 								        # "gptq_act_order": False,
 								        # "awq_ckpt": None,
 								        # "awq_wbits": 16,
 								        # "awq_groupsize": -1,
 								        # "model_names": [LLM_MODEL],
 								        # "conv_template": None,
 								        # "limit_worker_concurrency": 5,
 								        # "stream_interval": 2,
 								        # "no_register": False,
-												修复文心一言，添加测试用例

											
										
										
											2023-09-14 23:37:34 +08:00
+								        # "embed_in_truncate": False,
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
+								    },
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智谱AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								    "baichuan-7b": { # 使用default中的IP和端口
 								        "device": "cpu",
 								    },
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								    "zhipu-api": { # 请为每个要运行的在线API设置不同的端口
 								        "port": 21001,
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智谱AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								    },
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								    "minimax-api": {
 								        "port": 21002,
-												添加MiniMax在线API支持 (#1445)


											
										
										
											2023-09-12 15:24:47 +08:00
+								    },
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								    "xinghuo-api": {
 								        "port": 21003,
-												支持讯飞星火大模型在线API (#1460)

* 支持讯飞星火大模型在线API
											
										
										
											2023-09-13 13:51:05 +08:00
+								    },
-												修复文心一言，添加测试用例

											
										
										
											2023-09-14 23:37:34 +08:00
+								    "qianfan-api": {
-												优化configs (#1474)

* remove llm_model_dict

* optimize configs

* fix get_model_path

* 更改一些默认参数，添加千帆的默认配置

* Update server_config.py.example
											
										
										
											2023-09-15 17:52:22 +08:00
+								        "port": 21004,
-												修复文心一言，添加测试用例

											
										
										
											2023-09-14 23:37:34 +08:00
+								    },
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
+								}
 								# fastchat multi model worker server
 								FSCHAT_MULTI_MODEL_WORKERS = {
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智谱AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								    # TODO:
-												add startup.py: start specified servers with one command. see python startup.py --help

											
										
										
											2023-08-17 13:24:53 +08:00
+								}
 								# fastchat controller server
 								FSCHAT_CONTROLLER = {
 								    "host": DEFAULT_BIND_HOST,
 								    "port": 20001,
 								    "dispatch_method": "shortest_queue",
 								}