Skip to content

Commit

Permalink
Merge pull request #1 from Oscilloscope98/mtl-first-migration
Browse files: browse the repository at this point in the history
MTL first migration with bigdl-llm model worker for native Windows (only LLM on XPU)
  • Loading branch information
Oscilloscope98 authored Mar 14, 2024
2 parents d879e86 + de4ff2b commit 51edafe
Show file tree
Hide file tree
Showing 55 changed files with 199 additions and 2,468 deletions.
7 changes: 4 additions & 3 deletions configs/model_config.py.example
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ MODEL_ROOT_PATH = ""
EMBEDDING_MODEL = "bge-large-zh-v1.5"

# Embedding 模型运行设备。设为 "auto" 会自动检测(会有警告),也可手动设定为 "cuda","mps","cpu","xpu" 其中之一。
-EMBEDDING_DEVICE = "auto"
+EMBEDDING_DEVICE = "cpu"

# 选用的reranker模型
RERANKER_MODEL = "bge-reranker-large"
Expand All @@ -26,11 +26,12 @@ EMBEDDING_MODEL_OUTPUT_PATH = "output"
# 在这里,我们使用目前主流的两个离线模型,其中,chatglm3-6b 为默认加载模型。
# 如果你的显存不足,可使用 Qwen-1_8B-Chat, 该模型 FP16 仅需 3.8G显存。

-LLM_MODELS = ["chatglm3-6b", "zhipu-api", "openai-api"]
+# LLM_MODELS = ["chatglm3-6b", "zhipu-api", "openai-api"]
+LLM_MODELS = ["chatglm3-6b"]
Agent_MODEL = None

# LLM 模型运行设备。设为"auto"会自动检测(会有警告),也可手动设定为 "cuda","mps","cpu","xpu" 其中之一。
-LLM_DEVICE = "auto"
+LLM_DEVICE = "xpu"

HISTORY_LEN = 3

Expand Down
4 changes: 2 additions & 2 deletions configs/server_config.py.example
Original file line number Diff line number Diff line change
Expand Up @@ -91,10 +91,10 @@ FSCHAT_MODEL_WORKERS = {

},
"chatglm3-6b": {
-"device": "cuda",
+"device": "xpu",
},
"Qwen1.5-0.5B-Chat": {
-"device": "cuda",
+"device": "xpu",
},
# 以下配置可以不用修改,在model_config中设置启动的模型
"zhipu-api": {
Expand Down
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Diff not rendered.
Diff not rendered.
Diff not rendered.
Diff not rendered.
Diff not rendered.
Diff not rendered.
Diff not rendered.
Diff not rendered.
74 changes: 0 additions & 74 deletions knowledge_base/samples/content/llm/分布式训练技术原理.md

This file was deleted.

97 changes: 0 additions & 97 deletions knowledge_base/samples/content/llm/大模型应用技术原理.md

This file was deleted.

This file was deleted.

Loading

0 comments on commit 51edafe

Please sign in to comment.