Merge branch 'master' into pre-release
This commit is contained in:
commit
1d0c6a9184
|
|
@ -0,0 +1,22 @@
|
||||||
|
name: Close inactive issues
|
||||||
|
on:
|
||||||
|
schedule:
|
||||||
|
- cron: "30 1 * * *"
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
close-issues:
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
permissions:
|
||||||
|
issues: write
|
||||||
|
pull-requests: write
|
||||||
|
steps:
|
||||||
|
- uses: actions/stale@v5
|
||||||
|
with:
|
||||||
|
days-before-issue-stale: 30
|
||||||
|
days-before-issue-close: 14
|
||||||
|
stale-issue-label: "stale"
|
||||||
|
stale-issue-message: "This issue is stale because it has been open for 30 days with no activity."
|
||||||
|
close-issue-message: "This issue was closed because it has been inactive for 14 days since being marked as stale."
|
||||||
|
days-before-pr-stale: -1
|
||||||
|
days-before-pr-close: -1
|
||||||
|
repo-token: ${{ secrets.GITHUB_TOKEN }}
|
||||||
|
|
@ -4,6 +4,6 @@ logs
|
||||||
.idea/
|
.idea/
|
||||||
__pycache__/
|
__pycache__/
|
||||||
/knowledge_base/
|
/knowledge_base/
|
||||||
configs/*.py
|
/configs/*.py
|
||||||
.vscode/
|
.vscode/
|
||||||
.pytest_cache/
|
.pytest_cache/
|
||||||
|
|
|
||||||
|
|
@ -485,6 +485,6 @@ $ streamlit run webui.py --server.port 666
|
||||||
|
|
||||||
## 项目交流群
|
## 项目交流群
|
||||||
|
|
||||||
<img src="img/qr_code_59.jpg" alt="二维码" width="300" height="300" />
|
<img src="img/qr_code_60.jpg" alt="二维码" width="300" height="300" />
|
||||||
|
|
||||||
🎉 langchain-ChatGLM 项目微信交流群,如果你也对本项目感兴趣,欢迎加入群聊参与讨论交流。
|
🎉 langchain-ChatGLM 项目微信交流群,如果你也对本项目感兴趣,欢迎加入群聊参与讨论交流。
|
||||||
|
|
|
||||||
|
|
@ -5,7 +5,7 @@ from langchain.document_loaders.unstructured import UnstructuredFileLoader
|
||||||
class RapidOCRPDFLoader(UnstructuredFileLoader):
|
class RapidOCRPDFLoader(UnstructuredFileLoader):
|
||||||
def _get_elements(self) -> List:
|
def _get_elements(self) -> List:
|
||||||
def pdf2text(filepath):
|
def pdf2text(filepath):
|
||||||
import fitz
|
import fitz # pyMuPDF里面的fitz包,不要与pip install fitz混淆
|
||||||
from rapidocr_onnxruntime import RapidOCR
|
from rapidocr_onnxruntime import RapidOCR
|
||||||
import numpy as np
|
import numpy as np
|
||||||
ocr = RapidOCR()
|
ocr = RapidOCR()
|
||||||
|
|
|
||||||
Binary file not shown.
|
After Width: | Height: | Size: 248 KiB |
|
|
@ -91,8 +91,8 @@ LOADER_DICT = {"UnstructuredHTMLLoader": ['.html'],
|
||||||
"RapidOCRLoader": ['.png', '.jpg', '.jpeg', '.bmp'],
|
"RapidOCRLoader": ['.png', '.jpg', '.jpeg', '.bmp'],
|
||||||
"UnstructuredFileLoader": ['.eml', '.msg', '.rst',
|
"UnstructuredFileLoader": ['.eml', '.msg', '.rst',
|
||||||
'.rtf', '.txt', '.xml',
|
'.rtf', '.txt', '.xml',
|
||||||
'.doc', '.docx', '.epub', '.odt',
|
'.docx', '.epub', '.odt',
|
||||||
'.ppt', '.pptx', '.tsv'], # '.xlsx'
|
'.ppt', '.pptx', '.tsv'],
|
||||||
}
|
}
|
||||||
SUPPORTED_EXTS = [ext for sublist in LOADER_DICT.values() for ext in sublist]
|
SUPPORTED_EXTS = [ext for sublist in LOADER_DICT.values() for ext in sublist]
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -153,6 +153,7 @@ def dialogue_page(api: ApiRequest):
|
||||||
for d in api.knowledge_base_chat(prompt, selected_kb, kb_top_k, score_threshold, history, model=llm_model):
|
for d in api.knowledge_base_chat(prompt, selected_kb, kb_top_k, score_threshold, history, model=llm_model):
|
||||||
if error_msg := check_error_msg(d): # check whether error occurred
|
if error_msg := check_error_msg(d): # check whether error occurred
|
||||||
st.error(error_msg)
|
st.error(error_msg)
|
||||||
|
else:
|
||||||
text += d["answer"]
|
text += d["answer"]
|
||||||
chat_box.update_msg(text, 0)
|
chat_box.update_msg(text, 0)
|
||||||
chat_box.update_msg("\n\n".join(d["docs"]), 1, streaming=False)
|
chat_box.update_msg("\n\n".join(d["docs"]), 1, streaming=False)
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue