Adapted to the Ascend NPU #3933

Closed
wants to merge 1 commit into from
3 changes: 3 additions & 0 deletions server/knowledge_base/kb_cache/base.py
@@ -150,6 +150,9 @@ def load_embeddings(self, model: str = None, device: str = None) -> Embeddings:
             embeddings.query_instruction = ""
         else:
             from langchain.embeddings.huggingface import HuggingFaceEmbeddings
+            if device == "npu":
+                import torch_npu
+                torch_npu.npu.set_device("npu:0")
             embeddings = HuggingFaceEmbeddings(model_name=get_model_path(model),
                                                model_kwargs={'device': device})
         item.obj = embeddings
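For context, a minimal standalone sketch of what the added branch does when loading embeddings on Ascend. The model name below is illustrative (the patched code resolves it via get_model_path(model)), and it assumes torch_npu and the Ascend CANN toolkit are installed:

# Sketch only: pin the process to the first Ascend NPU, then load embeddings.
import torch_npu  # registers the "npu" device type with PyTorch
torch_npu.npu.set_device("npu:0")  # same call the patch adds

from langchain.embeddings.huggingface import HuggingFaceEmbeddings

embeddings = HuggingFaceEmbeddings(
    model_name="BAAI/bge-large-zh",    # illustrative model path
    model_kwargs={"device": "npu"},    # passed through to sentence-transformers/torch
)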
2 changes: 1 addition & 1 deletion server/llm_api_stale.py
@@ -62,7 +62,7 @@
 parser.add_argument(
     "--device",
     type=str,
-    choices=["cpu", "cuda", "mps", "xpu"],
+    choices=["cpu", "cuda", "mps", "xpu", "npu"],
     default="cuda",
     help="The device type",
 )
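With "npu" added to the allowed choices, the launcher can target Ascend directly. An illustrative invocation, with the other flags left at their defaults:

python server/llm_api_stale.py --device npu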
11 changes: 7 additions & 4 deletions server/utils.py
@@ -512,25 +512,28 @@ def _get_proxies():
 def detect_device() -> Literal["cuda", "mps", "cpu"]:
     try:
         import torch
+        import mindspore as ms

Review comment: The import on line 515 would be better placed just before line 520 — users on cuda or mps would then return directly without ever importing mindspore.

Review comment: Why use mindspore here instead of torch_npu directly? (See the sketch after this diff.)

         if torch.cuda.is_available():
             return "cuda"
         if torch.backends.mps.is_available():
             return "mps"
+        if ms.get_context(attr_key='device_target') == 'Ascend':
+            return "npu"
     except:
         pass
     return "cpu"


-def llm_device(device: str = None) -> Literal["cuda", "mps", "cpu"]:
+def llm_device(device: str = None) -> Literal["cuda", "mps", "cpu", "npu"]:
     device = device or LLM_DEVICE
-    if device not in ["cuda", "mps", "cpu"]:
+    if device not in ["cuda", "mps", "cpu", "npu"]:
         device = detect_device()
     return device


-def embedding_device(device: str = None) -> Literal["cuda", "mps", "cpu"]:
+def embedding_device(device: str = None) -> Literal["cuda", "mps", "cpu", "npu"]:
     device = device or EMBEDDING_DEVICE
-    if device not in ["cuda", "mps", "cpu"]:
+    if device not in ["cuda", "mps", "cpu", "npu"]:
         device = detect_device()
     return device

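Picking up both review comments above, a minimal sketch of how detect_device could probe the Ascend backend through torch_npu instead of mindspore, with the extra import deferred until the common backends have missed. It assumes torch_npu exposes npu.is_available() analogous to torch.cuda.is_available(); this is a sketch of the suggestion, not the code merged here:

from typing import Literal


def detect_device() -> Literal["cuda", "mps", "npu", "cpu"]:
    try:
        import torch
        if torch.cuda.is_available():
            return "cuda"
        if torch.backends.mps.is_available():
            return "mps"
        # Deferred import: cuda/mps users return above without ever
        # loading the Ascend stack (first review comment).
        import torch_npu
        if torch_npu.npu.is_available():
            return "npu"
    except Exception:
        pass
    return "cpu"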