# Langchain-Chatchat/server/api.py

import nltk
import sys
import os

sys.path.append(os.path.dirname(os.path.dirname(__file__)))

from configs.model_config import LLM_MODEL, NLTK_DATA_PATH
from configs.server_config import OPEN_CROSS_DOMAIN, HTTPX_DEFAULT_TIMEOUT
from configs import VERSION
import argparse
import uvicorn
from fastapi import Body
from fastapi.middleware.cors import CORSMiddleware
from starlette.responses import RedirectResponse
from server.chat import (chat, knowledge_base_chat, openai_chat,
                         search_engine_chat)
from server.knowledge_base.kb_api import list_kbs, create_kb, delete_kb
from server.knowledge_base.kb_doc_api import (list_files, upload_doc, delete_doc,
                                              update_doc, download_doc, recreate_vector_store,
                                              search_docs, DocumentWithScore)
from server.utils import BaseResponse, ListResponse, FastAPI, MakeFastAPIOffline, fschat_controller_address
import httpx
from typing import List

# Prepend the configured NLTK_DATA_PATH to NLTK's data path list, keeping the
# existing entries after it.
nltk.data.path = [NLTK_DATA_PATH] + nltk.data.path


async def document():
    """Return a redirect response pointing the caller at ``/docs``."""
    docs_redirect = RedirectResponse(url="/docs")
    return docs_redirect


def create_app() -> FastAPI:
    """
    Build the FastAPI application and register every route on it.

    Routes are attached in three groups: chat endpoints, knowledge-base
    management endpoints, and LLM model management endpoints. The last group
    is defined inline and forwards requests to a fastchat controller via
    ``httpx.post``.

    Returns:
        The configured application object.
    """
    app = FastAPI(
        title="Langchain-Chatchat API Server",
        version=VERSION
    )
    # Helper imported from server.utils; presumably makes the Swagger UI work
    # without external network access — TODO confirm against its definition.
    MakeFastAPIOffline(app)
    # Add CORS middleware to allow all origins.
    # Cross-origin access is enabled only when OPEN_CROSS_DOMAIN (imported
    # from configs.server_config) is truthy.
    # NOTE(review): allow_origins=["*"] combined with allow_credentials=True
    # is a very permissive policy — confirm this is intended.
    if OPEN_CROSS_DOMAIN:
        app.add_middleware(
            CORSMiddleware,
            allow_origins=["*"],
            allow_credentials=True,
            allow_methods=["*"],
            allow_headers=["*"],
        )

    # Root path: document() answers with a redirect to "/docs".
    # NOTE(review): response_model is BaseResponse although the handler
    # returns a RedirectResponse — the declared schema probably does not
    # describe the real response; confirm.
    app.get("/",
            response_model=BaseResponse,
            summary="swagger 文档")(document)

    # Tag: Chat
    app.post("/chat/fastchat",
             tags=["Chat"],
             summary="与llm模型对话(直接与fastchat api对话)")(openai_chat)

    app.post("/chat/chat",
             tags=["Chat"],
             summary="与llm模型对话(通过LLMChain)")(chat)

    app.post("/chat/knowledge_base_chat",
             tags=["Chat"],
             summary="与知识库对话")(knowledge_base_chat)

    app.post("/chat/search_engine_chat",
             tags=["Chat"],
             summary="与搜索引擎对话")(search_engine_chat)

    # Tag: Knowledge Base Management
    app.get("/knowledge_base/list_knowledge_bases",
            tags=["Knowledge Base Management"],
            response_model=ListResponse,
            summary="获取知识库列表")(list_kbs)

    app.post("/knowledge_base/create_knowledge_base",
             tags=["Knowledge Base Management"],
             response_model=BaseResponse,
             summary="创建知识库"
             )(create_kb)

    # Deletion endpoints are registered as POST rather than DELETE.
    app.post("/knowledge_base/delete_knowledge_base",
             tags=["Knowledge Base Management"],
             response_model=BaseResponse,
             summary="删除知识库"
             )(delete_kb)

    app.get("/knowledge_base/list_files",
            tags=["Knowledge Base Management"],
            response_model=ListResponse,
            summary="获取知识库内的文件列表"
            )(list_files)

    app.post("/knowledge_base/search_docs",
             tags=["Knowledge Base Management"],
             response_model=List[DocumentWithScore],
             summary="搜索知识库"
             )(search_docs)

    app.post("/knowledge_base/upload_doc",
             tags=["Knowledge Base Management"],
             response_model=BaseResponse,
             summary="上传文件到知识库"
             )(upload_doc)

    app.post("/knowledge_base/delete_doc",
             tags=["Knowledge Base Management"],
             response_model=BaseResponse,
             summary="删除知识库内指定文件"
             )(delete_doc)

    app.post("/knowledge_base/update_doc",
             tags=["Knowledge Base Management"],
             response_model=BaseResponse,
             summary="更新现有文件到知识库"
             )(update_doc)

    # No response_model on the next two routes.
    app.get("/knowledge_base/download_doc",
            tags=["Knowledge Base Management"],
            summary="下载对应的知识文件")(download_doc)

    app.post("/knowledge_base/recreate_vector_store",
             tags=["Knowledge Base Management"],
             summary="根据content中文档重建向量库，流式输出处理进度。"
             )(recreate_vector_store)

    # LLM model management endpoints.
    # The handler docstrings below are kept verbatim: FastAPI uses a handler's
    # docstring as the endpoint description in the generated API docs, so they
    # are runtime text. English glosses are given in the comments instead.

    # list_models: get the list of loaded models from the fastchat controller.
    @app.post("/llm_model/list_models",
            tags=["LLM Model Management"],
            summary="列出当前已加载的模型")
    def list_models(
        controller_address: str = Body(None, description="Fastchat controller服务器地址", examples=[fschat_controller_address()])
    ) -> BaseResponse:
        '''
        从fastchat controller获取已加载模型列表
        '''
        try:
            # Fall back to the configured controller when no address is sent.
            controller_address = controller_address or fschat_controller_address()
            r = httpx.post(controller_address + "/list_models")
            return BaseResponse(data=r.json()["models"])
        except Exception as e:
            # Any failure (request error, invalid JSON, missing "models" key)
            # is reported as a code=500 BaseResponse instead of being raised.
            return BaseResponse(
                code=500,
                data=[],
                msg=f"failed to get available models from controller: {controller_address}。错误信息是： {e}")

    # stop_llm_model: ask the fastchat controller to stop an LLM model.
    # Per the original docstring: because of how Fastchat is implemented, this
    # actually stops the model_worker that hosts the model.
    @app.post("/llm_model/stop",
            tags=["LLM Model Management"],
            summary="停止指定的LLM模型（Model Worker)",
            )
    def stop_llm_model(
        model_name: str = Body(..., description="要停止的LLM模型名称", examples=[LLM_MODEL]),
        controller_address: str = Body(None, description="Fastchat controller服务器地址", examples=[fschat_controller_address()])
    ) -> BaseResponse:
        '''
        向fastchat controller请求停止某个LLM模型。
        注意：由于Fastchat的实现方式，实际上是把LLM模型所在的model_worker停掉。
        '''
        try:
            controller_address = controller_address or fschat_controller_address()
            r = httpx.post(
                controller_address + "/release_worker",
                json={"model_name": model_name},
            )
            # The controller's JSON reply is returned as-is.
            return r.json()
        except Exception as e:
            return BaseResponse(
                code=500,
                msg=f"failed to stop LLM model {model_name} from controller: {controller_address}。错误信息是： {e}")

    # change_llm_model: ask the fastchat controller to switch the LLM model.
    # Uses the same "/release_worker" controller path as stop_llm_model, with
    # an additional "new_model_name" field in the JSON payload.
    @app.post("/llm_model/change",
            tags=["LLM Model Management"],
            summary="切换指定的LLM模型（Model Worker)",
            )
    def change_llm_model(
        model_name: str = Body(..., description="当前运行模型", examples=[LLM_MODEL]),
        new_model_name: str = Body(..., description="要切换的新模型", examples=[LLM_MODEL]),
        controller_address: str = Body(None, description="Fastchat controller服务器地址", examples=[fschat_controller_address()])
    ):
        '''
        向fastchat controller请求切换LLM模型。
        '''
        try:
            controller_address = controller_address or fschat_controller_address()
            r = httpx.post(
                controller_address + "/release_worker",
                json={"model_name": model_name, "new_model_name": new_model_name},
                timeout=HTTPX_DEFAULT_TIMEOUT, # wait for new worker_model
            )
            return r.json()
        except Exception as e:
            return BaseResponse(
                code=500,
                msg=f"failed to switch LLM model from controller: {controller_address}。错误信息是： {e}")

    return app


# Module-level application instance; run_api() below passes it to uvicorn.run.
app = create_app()


def run_api(host, port, **kwargs):
    """
    Start uvicorn serving the module-level ``app`` on ``host``:``port``.

    The ``ssl_keyfile`` and ``ssl_certfile`` keyword arguments are forwarded
    to uvicorn only when both are present and truthy; otherwise neither is
    passed. Any other keyword argument is ignored.
    """
    key_path = kwargs.get("ssl_keyfile")
    cert_path = kwargs.get("ssl_certfile")

    # Guard clause: without a complete key/cert pair, start without SSL options.
    if not (key_path and cert_path):
        uvicorn.run(app, host=host, port=port)
        return

    uvicorn.run(
        app,
        host=host,
        port=port,
        ssl_keyfile=key_path,
        ssl_certfile=cert_path,
    )


if __name__ == "__main__":
    # Script entry point: read the bind address and optional SSL file paths
    # from the command line, then start the server through run_api().
    cli_parser = argparse.ArgumentParser(
        prog='langchain-ChatGLM',
        description='About langchain-ChatGLM, local knowledge based ChatGLM with langchain'
                    ' ｜ 基于本地知识库的 ChatGLM 问答',
    )
    # (flag, add_argument keyword options) in registration order.
    option_specs = (
        ("--host", {"type": str, "default": "0.0.0.0"}),
        ("--port", {"type": int, "default": 7861}),
        ("--ssl_keyfile", {"type": str}),
        ("--ssl_certfile", {"type": str}),
    )
    for flag, spec in option_specs:
        cli_parser.add_argument(flag, **spec)

    args = cli_parser.parse_args()
    args_dict = vars(args)
    # args_dict holds exactly host, port, ssl_keyfile and ssl_certfile, so it
    # can be forwarded to run_api() as keyword arguments unchanged.
    run_api(**args_dict)
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
+								import nltk
-												make api.py import model_config correctly

											
										
										
											2023-07-29 23:00:50 +08:00
+								import sys
 								import os
-												update import pkgs and format

											
										
										
											2023-08-10 21:26:05 +08:00
-												make api.py import model_config correctly

											
										
										
											2023-07-29 23:00:50 +08:00
+								sys.path.append(os.path.dirname(os.path.dirname(__file__)))
-												change kb_api functions with KnowledgeBase class method

											
										
										
											2023-08-05 03:15:41 +08:00
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智普AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								from configs.model_config import LLM_MODEL, NLTK_DATA_PATH
 								from configs.server_config import OPEN_CROSS_DOMAIN, HTTPX_DEFAULT_TIMEOUT
-												update configs.__init__, webui.py and api.py

											
										
										
											2023-08-17 22:19:26 +08:00
+								from configs import VERSION
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
+								import argparse
 								import uvicorn
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智普AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								from fastapi import Body
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
+								from fastapi.middleware.cors import CORSMiddleware
-												add bing_search_chat.py and duckduckgo_search_chat.py

											
										
										
											2023-08-01 16:39:17 +08:00
+								from starlette.responses import RedirectResponse
 								from server.chat import (chat, knowledge_base_chat, openai_chat,
-. change bing_search_chat and duckduckgo_search_chat into search_engine_chat
2. add knowledge_base not found to knowledge_base_chat and add search_engine not found to search_engine_chat

											
										
										
											2023-08-03 18:22:36 +08:00
+								                         search_engine_chat)
-												update knowledge base kbservice and api:
1. make huggingfaceembeddings hashable
2. unify embeddings' loading method for all kbservice
3. make ApiRequest skip empty content when streaming json to avoid dict
   KeyError

											
										
										
											2023-08-09 10:46:01 +08:00
+								from server.knowledge_base.kb_api import list_kbs, create_kb, delete_kb
-												增加数据库字段，重建知识库使用多线程 (#1280)

* close #1172: 给webui_page/utils添加一些log信息，方便定位错误

* 修复：重建知识库时页面未实时显示进度

* skip model_worker running when using online model api such as chatgpt

* 修改知识库管理相关内容:
1.KnowledgeFileModel增加3个字段：file_mtime(文件修改时间),file_size(文件大小),custom_docs(是否使用自定义docs)。为后面比对上传文件做准备。
2.给所有String字段加上长度，防止mysql建表错误(pr#1177)
3.统一[faiss/milvus/pgvector]_kb_service.add_doc接口，使其支持自定义docs
4.为faiss_kb_service增加一些方法，便于调用
5.为KnowledgeFile增加一些方法，便于获取文件信息，缓存file2text的结果。

* 修复/chat/fastchat无法流式输出的问题

* 新增功能：
1、KnowledgeFileModel增加"docs_count"字段，代表该文件加载到向量库中的Document数量，并在WEBUI中进行展示。
2、重建知识库`python init_database.py --recreate-vs`支持多线程。

其它：
统一代码中知识库相关函数用词：file代表一个文件名称或路径，doc代表langchain加载后的Document。部分与API接口有关或含义重叠的函数暂未修改。

---------

Co-authored-by: liunux4odoo <liunux@qq.com>, hongkong9771 
											
										
										
											2023-08-28 13:50:35 +08:00
+								from server.knowledge_base.kb_doc_api import (list_files, upload_doc, delete_doc,
-												update api and webui:
1. 增加search_docs接口，返回原始知识库检索文档，close #1103
2. 为FAISS检索增加score_threshold参数。milvus和PG暂不支持

											
										
										
											2023-08-16 13:18:58 +08:00
+								                                              update_doc, download_doc, recreate_vector_store,
-												update configs.__init__, webui.py and api.py

											
										
										
											2023-08-17 22:19:26 +08:00
+								                                              search_docs, DocumentWithScore)
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智普AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								from server.utils import BaseResponse, ListResponse, FastAPI, MakeFastAPIOffline, fschat_controller_address
 								import httpx
-												update api and webui:
1. 增加search_docs接口，返回原始知识库检索文档，close #1103
2. 为FAISS检索增加score_threshold参数。milvus和PG暂不支持

											
										
										
											2023-08-16 13:18:58 +08:00
+								from typing import List
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
+								nltk.data.path = [NLTK_DATA_PATH] + nltk.data.path
 								async def document():
 								    return RedirectResponse(url="/docs")
-												split api_start to create_app & run_api. user can run api with uvicorn in console: uvicorn server.api:app --port 7861

											
										
										
											2023-07-31 10:05:19 +08:00
+								def create_app():
-												update configs.__init__, webui.py and api.py

											
										
										
											2023-08-17 22:19:26 +08:00
+								    app = FastAPI(
 								        title="Langchain-Chatchat API Server",
 								        version=VERSION
 								    )
-												update llm_api and api server:
1. fastchat's controller/model_worker/api_server use swagger UI offline.
2. add custom title and icon.
3. remove fastapi-offline dependency

											
										
										
											2023-08-16 14:20:09 +08:00
+								    MakeFastAPIOffline(app)
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
+								    # Add CORS middleware to allow all origins
 								    # 在config.py中设置OPEN_DOMAIN=True，允许跨域
 								    # set OPEN_DOMAIN=True in config.py to allow cross-domain
 								    if OPEN_CROSS_DOMAIN:
 								        app.add_middleware(
 								            CORSMiddleware,
 								            allow_origins=["*"],
 								            allow_credentials=True,
 								            allow_methods=["*"],
 								            allow_headers=["*"],
 								        )
 								    app.get("/",
 								            response_model=BaseResponse,
 								            summary="swagger 文档")(document)
-. change bing_search_chat and duckduckgo_search_chat into search_engine_chat
2. add knowledge_base not found to knowledge_base_chat and add search_engine not found to search_engine_chat

											
										
										
											2023-08-03 18:22:36 +08:00
+								    # Tag: Chat
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
+								    app.post("/chat/fastchat",
 								             tags=["Chat"],
 								             summary="与llm模型对话(直接与fastchat api对话)")(openai_chat)
 								    app.post("/chat/chat",
 								             tags=["Chat"],
 								             summary="与llm模型对话(通过LLMChain)")(chat)
 								    app.post("/chat/knowledge_base_chat",
 								             tags=["Chat"],
 								             summary="与知识库对话")(knowledge_base_chat)
-. change bing_search_chat and duckduckgo_search_chat into search_engine_chat
2. add knowledge_base not found to knowledge_base_chat and add search_engine not found to search_engine_chat

											
										
										
											2023-08-03 18:22:36 +08:00
+								    app.post("/chat/search_engine_chat",
-												add bing_search_chat.py and duckduckgo_search_chat.py

											
										
										
											2023-08-01 16:39:17 +08:00
+								             tags=["Chat"],
-. change bing_search_chat and duckduckgo_search_chat into search_engine_chat
2. add knowledge_base not found to knowledge_base_chat and add search_engine not found to search_engine_chat

											
										
										
											2023-08-03 18:22:36 +08:00
+								             summary="与搜索引擎对话")(search_engine_chat)
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
-												add history to chat apis

											
										
										
											2023-08-08 23:55:27 +08:00
+								    # Tag: Knowledge Base Management
 								    app.get("/knowledge_base/list_knowledge_bases",
 								            tags=["Knowledge Base Management"],
 								            response_model=ListResponse,
 								            summary="获取知识库列表")(list_kbs)
 								    app.post("/knowledge_base/create_knowledge_base",
 								             tags=["Knowledge Base Management"],
 								             response_model=BaseResponse,
 								             summary="创建知识库"
 								             )(create_kb)
-												更新API与ApiRequest：
1. 重新整理webui_pages/utils与server/knowledge_base间的工具依赖
2.
将delete_knowledge_base与delete_doc接口从delete改为post.delete不支持body参数
3. 修复update_doc
4. 修复部分bug

											
										
										
											2023-08-11 08:37:07 +08:00
+								    app.post("/knowledge_base/delete_knowledge_base",
-												update configs.__init__, webui.py and api.py

											
										
										
											2023-08-17 22:19:26 +08:00
+								             tags=["Knowledge Base Management"],
 								             response_model=BaseResponse,
 								             summary="删除知识库"
 								             )(delete_kb)
-												add history to chat apis

											
										
										
											2023-08-08 23:55:27 +08:00
-												增加数据库字段，重建知识库使用多线程 (#1280)

* close #1172: 给webui_page/utils添加一些log信息，方便定位错误

* 修复：重建知识库时页面未实时显示进度

* skip model_worker running when using online model api such as chatgpt

* 修改知识库管理相关内容:
1.KnowledgeFileModel增加3个字段：file_mtime(文件修改时间),file_size(文件大小),custom_docs(是否使用自定义docs)。为后面比对上传文件做准备。
2.给所有String字段加上长度，防止mysql建表错误(pr#1177)
3.统一[faiss/milvus/pgvector]_kb_service.add_doc接口，使其支持自定义docs
4.为faiss_kb_service增加一些方法，便于调用
5.为KnowledgeFile增加一些方法，便于获取文件信息，缓存file2text的结果。

* 修复/chat/fastchat无法流式输出的问题

* 新增功能：
1、KnowledgeFileModel增加"docs_count"字段，代表该文件加载到向量库中的Document数量，并在WEBUI中进行展示。
2、重建知识库`python init_database.py --recreate-vs`支持多线程。

其它：
统一代码中知识库相关函数用词：file代表一个文件名称或路径，doc代表langchain加载后的Document。部分与API接口有关或含义重叠的函数暂未修改。

---------

Co-authored-by: liunux4odoo <liunux@qq.com>, hongkong9771 
											
										
										
											2023-08-28 13:50:35 +08:00
+								    app.get("/knowledge_base/list_files",
-												add history to chat apis

											
										
										
											2023-08-08 23:55:27 +08:00
+								            tags=["Knowledge Base Management"],
 								            response_model=ListResponse,
 								            summary="获取知识库内的文件列表"
-												增加数据库字段，重建知识库使用多线程 (#1280)

* close #1172: 给webui_page/utils添加一些log信息，方便定位错误

* 修复：重建知识库时页面未实时显示进度

* skip model_worker running when using online model api such as chatgpt

* 修改知识库管理相关内容:
1.KnowledgeFileModel增加3个字段：file_mtime(文件修改时间),file_size(文件大小),custom_docs(是否使用自定义docs)。为后面比对上传文件做准备。
2.给所有String字段加上长度，防止mysql建表错误(pr#1177)
3.统一[faiss/milvus/pgvector]_kb_service.add_doc接口，使其支持自定义docs
4.为faiss_kb_service增加一些方法，便于调用
5.为KnowledgeFile增加一些方法，便于获取文件信息，缓存file2text的结果。

* 修复/chat/fastchat无法流式输出的问题

* 新增功能：
1、KnowledgeFileModel增加"docs_count"字段，代表该文件加载到向量库中的Document数量，并在WEBUI中进行展示。
2、重建知识库`python init_database.py --recreate-vs`支持多线程。

其它：
统一代码中知识库相关函数用词：file代表一个文件名称或路径，doc代表langchain加载后的Document。部分与API接口有关或含义重叠的函数暂未修改。

---------

Co-authored-by: liunux4odoo <liunux@qq.com>, hongkong9771 
											
										
										
											2023-08-28 13:50:35 +08:00
+								            )(list_files)
-												add history to chat apis

											
										
										
											2023-08-08 23:55:27 +08:00
-												update api and webui:
1. 增加search_docs接口，返回原始知识库检索文档，close #1103
2. 为FAISS检索增加score_threshold参数。milvus和PG暂不支持

											
										
										
											2023-08-16 13:18:58 +08:00
+								    app.post("/knowledge_base/search_docs",
-												update configs.__init__, webui.py and api.py

											
										
										
											2023-08-17 22:19:26 +08:00
+								             tags=["Knowledge Base Management"],
 								             response_model=List[DocumentWithScore],
 								             summary="搜索知识库"
 								             )(search_docs)
-												update api and webui:
1. 增加search_docs接口，返回原始知识库检索文档，close #1103
2. 为FAISS检索增加score_threshold参数。milvus和PG暂不支持

											
										
										
											2023-08-16 13:18:58 +08:00
-												add history to chat apis

											
										
										
											2023-08-08 23:55:27 +08:00
+								    app.post("/knowledge_base/upload_doc",
 								             tags=["Knowledge Base Management"],
 								             response_model=BaseResponse,
 								             summary="上传文件到知识库"
 								             )(upload_doc)
-												更新API与ApiRequest：
1. 重新整理webui_pages/utils与server/knowledge_base间的工具依赖
2.
将delete_knowledge_base与delete_doc接口从delete改为post.delete不支持body参数
3. 修复update_doc
4. 修复部分bug

											
										
										
											2023-08-11 08:37:07 +08:00
+								    app.post("/knowledge_base/delete_doc",
-												update configs.__init__, webui.py and api.py

											
										
										
											2023-08-17 22:19:26 +08:00
+								             tags=["Knowledge Base Management"],
 								             response_model=BaseResponse,
 								             summary="删除知识库内指定文件"
 								             )(delete_doc)
-												add history to chat apis

											
										
										
											2023-08-08 23:55:27 +08:00
-												update api/kb_doc_api and knowledge base management ui:
1. add update_doc to api which can update vector store from an existing
   content file
2. add parameter `delete_content` to delete_doc api. user can decide
   whether to delete the local content file when deleting a doc.
3. fix bug in ApiRequest.upload_doc
4. support listing docs that exist in the local folder but not in db

											
										
										
											2023-08-09 16:52:04 +08:00
+								    app.post("/knowledge_base/update_doc",
 								             tags=["Knowledge Base Management"],
 								             response_model=BaseResponse,
 								             summary="更新现有文件到知识库"
 								             )(update_doc)
-												add history to chat apis

											
										
										
											2023-08-08 23:55:27 +08:00
-												update api and webui:
1. add download_doc to api
2. return local path or http url in knowledge_base_chat depending on
   no_remote_api
3. change assistant avatar in webui

											
										
										
											2023-08-14 11:46:36 +08:00
+								    app.get("/knowledge_base/download_doc",
 								            tags=["Knowledge Base Management"],
 								            summary="下载对应的知识文件")(download_doc)
-												add history to chat apis

											
										
										
											2023-08-08 23:55:27 +08:00
+								    app.post("/knowledge_base/recreate_vector_store",
 								             tags=["Knowledge Base Management"],
 								             summary="根据content中文档重建向量库，流式输出处理进度。"
 								             )(recreate_vector_store)
-												automatically init vector store info to database when run api.py & webui.py

											
										
										
											2023-08-10 14:12:02 +08:00
-												添加切换模型功能，支持智谱AI在线模型 (#1342)

* 添加LLM模型切换功能，需要在server_config中设置可切换的模型
* add tests for api.py/llm_model/*
* - 支持模型切换
- 支持智普AI线上模型
- startup.py增加参数`--api-worker`，自动运行所有的线上API模型。使用`-a
  (--all-webui), --all-api`时默认开启该选项
* 修复被fastchat覆盖的标准输出
* 对fastchat日志进行更细致的控制，startup.py中增加-q(--quiet)开关，可以减少无用的fastchat日志输出
* 修正chatglm api的对话模板


Co-authored-by: liunux4odoo <liunu@qq.com>
											
										
										
											2023-09-01 23:58:09 +08:00
+								    # LLM模型相关接口
 								    @app.post("/llm_model/list_models",
 								            tags=["LLM Model Management"],
 								            summary="列出当前已加载的模型")
 								    def list_models(
 								        controller_address: str = Body(None, description="Fastchat controller服务器地址", examples=[fschat_controller_address()])
 								    ) -> BaseResponse:
 								        '''
 								        从fastchat controller获取已加载模型列表
 								        '''
 								        try:
 								            controller_address = controller_address or fschat_controller_address()
 								            r = httpx.post(controller_address + "/list_models")
 								            return BaseResponse(data=r.json()["models"])
 								        except Exception as e:
 								            return BaseResponse(
 								                code=500,
 								                data=[],
 								                msg=f"failed to get available models from controller: {controller_address}。错误信息是： {e}")
 								    @app.post("/llm_model/stop",
 								            tags=["LLM Model Management"],
 								            summary="停止指定的LLM模型（Model Worker)",
 								            )
 								    def stop_llm_model(
 								        model_name: str = Body(..., description="要停止的LLM模型名称", examples=[LLM_MODEL]),
 								        controller_address: str = Body(None, description="Fastchat controller服务器地址", examples=[fschat_controller_address()])
 								    ) -> BaseResponse:
 								        '''
 								        向fastchat controller请求停止某个LLM模型。
 								        注意：由于Fastchat的实现方式，实际上是把LLM模型所在的model_worker停掉。
 								        '''
 								        try:
 								            controller_address = controller_address or fschat_controller_address()
 								            r = httpx.post(
 								                controller_address + "/release_worker",
 								                json={"model_name": model_name},
 								            )
 								            return r.json()
 								        except Exception as e:
 								            return BaseResponse(
 								                code=500,
 								                msg=f"failed to stop LLM model {model_name} from controller: {controller_address}。错误信息是： {e}")
 								    @app.post("/llm_model/change",
 								            tags=["LLM Model Management"],
 								            summary="切换指定的LLM模型（Model Worker)",
 								            )
 								    def change_llm_model(
 								        model_name: str = Body(..., description="当前运行模型", examples=[LLM_MODEL]),
 								        new_model_name: str = Body(..., description="要切换的新模型", examples=[LLM_MODEL]),
 								        controller_address: str = Body(None, description="Fastchat controller服务器地址", examples=[fschat_controller_address()])
 								    ):
 								        '''
 								        向fastchat controller请求切换LLM模型。
 								        '''
 								        try:
 								            controller_address = controller_address or fschat_controller_address()
 								            r = httpx.post(
 								                controller_address + "/release_worker",
 								                json={"model_name": model_name, "new_model_name": new_model_name},
 								                timeout=HTTPX_DEFAULT_TIMEOUT, # wait for new worker_model
 								            )
 								            return r.json()
 								        except Exception as e:
 								            return BaseResponse(
 								                code=500,
 								                msg=f"failed to switch LLM model from controller: {controller_address}。错误信息是： {e}")
-												split api_start to create_app & run_api. user can run api with uvicorn in console: uvicorn server.api:app --port 7861

											
										
										
											2023-07-31 10:05:19 +08:00
+								    return app
-												change kb_api functions with KnowledgeBase class method

											
										
										
											2023-08-05 03:15:41 +08:00
-												split api_start to create_app & run_api. user can run api with uvicorn in console: uvicorn server.api:app --port 7861

											
										
										
											2023-07-31 10:05:19 +08:00
+								app = create_app()
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
-												change kb_api functions with KnowledgeBase class method

											
										
										
											2023-08-05 03:15:41 +08:00
-												split api_start to create_app & run_api. user can run api with uvicorn in console: uvicorn server.api:app --port 7861

											
										
										
											2023-07-31 10:05:19 +08:00
+								def run_api(host, port, **kwargs):
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
+								    if kwargs.get("ssl_keyfile") and kwargs.get("ssl_certfile"):
-												update format in api.py

											
										
										
											2023-08-01 21:53:19 +08:00
+								        uvicorn.run(app,
 								                    host=host,
 								                    port=port,
 								                    ssl_keyfile=kwargs.get("ssl_keyfile"),
 								                    ssl_certfile=kwargs.get("ssl_certfile"),
 								                    )
-												v0.2.0 first commit

											
										
										
											2023-07-27 23:22:07 +08:00
+								    else:
 								        uvicorn.run(app, host=host, port=port)
 								if __name__ == "__main__":
 								    parser = argparse.ArgumentParser(prog='langchain-ChatGLM',
 								                                     description='About langchain-ChatGLM, local knowledge based ChatGLM with langchain'
 								                                                 ' ｜ 基于本地知识库的 ChatGLM 问答')
 								    parser.add_argument("--host", type=str, default="0.0.0.0")
 								    parser.add_argument("--port", type=int, default=7861)
 								    parser.add_argument("--ssl_keyfile", type=str)
 								    parser.add_argument("--ssl_certfile", type=str)
 								    # 初始化消息
 								    args = parser.parse_args()
 								    args_dict = vars(args)
-												update format in api.py

											
										
										
											2023-08-01 21:53:19 +08:00
+								    run_api(host=args.host,
 								            port=args.port,
 								            ssl_keyfile=args.ssl_keyfile,
 								            ssl_certfile=args.ssl_certfile,
 								            )