Spaces:
Runtime error
Runtime error
thomas-yanxin
committed on
Commit
·
dc18ab0
1
Parent(s):
ed22028
update
Browse files
- app.py +0 -1
- chatllm.py +1 -1
app.py
CHANGED
|
@@ -26,7 +26,6 @@ embedding_model_dict = {
|
|
| 26 |
|
| 27 |
llm_model_dict = {
|
| 28 |
"ChatGLM-6B-int4": "THUDM/chatglm-6b-int4",
|
| 29 |
-
"ChatGLM-6B-int8": "THUDM/chatglm-6b-int8",
|
| 30 |
"ChatGLM-6b-int4-qe": "THUDM/chatglm-6b-int4-qe",
|
| 31 |
"Minimax": "Minimax"
|
| 32 |
}
|
|
|
|
| 26 |
|
| 27 |
llm_model_dict = {
|
| 28 |
"ChatGLM-6B-int4": "THUDM/chatglm-6b-int4",
|
|
|
|
| 29 |
"ChatGLM-6b-int4-qe": "THUDM/chatglm-6b-int4-qe",
|
| 30 |
"Minimax": "Minimax"
|
| 31 |
}
|
chatllm.py
CHANGED
|
@@ -9,7 +9,7 @@ from transformers import AutoModel, AutoTokenizer
|
|
| 9 |
|
| 10 |
os.environ["TOKENIZERS_PARALLELISM"] = "false"
|
| 11 |
|
| 12 |
-
DEVICE = "
|
| 13 |
DEVICE_ID = "0"
|
| 14 |
CUDA_DEVICE = f"{DEVICE}:{DEVICE_ID}" if DEVICE_ID else DEVICE
|
| 15 |
|
|
|
|
| 9 |
|
| 10 |
os.environ["TOKENIZERS_PARALLELISM"] = "false"
|
| 11 |
|
| 12 |
+
DEVICE = "cuda"
|
| 13 |
DEVICE_ID = "0"
|
| 14 |
CUDA_DEVICE = f"{DEVICE}:{DEVICE_ID}" if DEVICE_ID else DEVICE
|
| 15 |
|