Update web_demo.py

改用更先进的方式加载模型：向 from_pretrained 传入 device='cuda'，取代加载后再调用 .cuda()
2023-06-30 10:26:50 +08:00 · 2023-06-30 10:26:50 +08:00 · 07d463034b
parent e84a5f3c14
commit 07d463034b
1 changed file with 1 addition and 1 deletion
--- a/web_demo.py
+++ b/web_demo.py
@@ -4,7 +4,7 @@ import mdtex2html
 from utils import load_model_on_gpus

 tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm2-6b", trust_remote_code=True)
-model = AutoModel.from_pretrained("THUDM/chatglm2-6b", trust_remote_code=True).cuda()
+model = AutoModel.from_pretrained("THUDM/chatglm2-6b", trust_remote_code=True, device='cuda')#.cuda()
 # 多显卡支持，使用下面两行代替上面一行，将num_gpus改为你实际的显卡数量
 # from utils import load_model_on_gpus
 # model = load_model_on_gpus("THUDM/chatglm2-6b", num_gpus=2)