2023-04-13 23:01:52 +08:00
|
|
|
import torch.cuda
|
|
|
|
|
import torch.backends
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Supported embedding models: short alias -> model identifier.
# Values are either hub-style "org/name" ids or a relative local directory
# (the "local-*" entry); how they are resolved is up to the loading code.
embedding_model_dict = {
    "ernie-tiny": "nghuyong/ernie-3.0-nano-zh",
    "ernie-base": "nghuyong/ernie-3.0-base-zh",
    "text2vec": "GanymedeNil/text2vec-large-chinese",
    "local-text2vec": "./embedding/text2vec-large-chinese",
}
|
|
|
|
|
|
|
|
|
|
# Embedding model name.
# NOTE(review): presumably used as a key into embedding_model_dict, which
# defines a "local-text2vec" entry -- confirm against the consumer.
EMBEDDING_MODEL = "local-text2vec"
|
2023-04-13 23:01:52 +08:00
|
|
|
|
|
|
|
|
# Embedding running device: prefer CUDA, then Apple MPS, otherwise CPU.
# `torch.backends.mps` is looked up with getattr because PyTorch builds that
# lack the submodule would otherwise raise AttributeError at import time.
EMBEDDING_DEVICE = (
    "cuda"
    if torch.cuda.is_available()
    else "mps"
    if getattr(torch.backends, "mps", None) is not None
    and torch.backends.mps.is_available()
    else "cpu"
)
|
|
|
|
|
|
|
|
|
|
# Supported LLM models: short alias -> model identifier.
# Values are either hub-style "org/name" ids or a relative local directory
# (the "local-*" entry); how they are resolved is up to the loading code.
llm_model_dict = {
    "chatglm-6b-int4-qe": "THUDM/chatglm-6b-int4-qe",
    "chatglm-6b-int4": "THUDM/chatglm-6b-int4",
    "chatglm-6b": "THUDM/chatglm-6b",
    "local-chatglm-6b": "./llm/chatglm-6b",
}
|
|
|
|
|
|
|
|
|
|
# LLM model name.
# NOTE(review): presumably used as a key into llm_model_dict, which defines
# a "local-chatglm-6b" entry -- confirm against the consumer.
LLM_MODEL = "local-chatglm-6b"
|
2023-04-13 23:01:52 +08:00
|
|
|
|
2023-04-15 14:43:12 +08:00
|
|
|
# Whether to use the p-tuning-v2 PrefixEncoder (disabled by default).
USE_PTUNING_V2 = False
|
|
|
|
|
|
2023-04-13 23:01:52 +08:00
|
|
|
# LLM running device: prefer CUDA, then Apple MPS, otherwise CPU.
# `torch.backends.mps` is looked up with getattr because PyTorch builds that
# lack the submodule would otherwise raise AttributeError at import time.
LLM_DEVICE = (
    "cuda"
    if torch.cuda.is_available()
    else "mps"
    if getattr(torch.backends, "mps", None) is not None
    and torch.backends.mps.is_available()
    else "cpu"
)
|
|
|
|
|
|