Update app.py
Browse files
app.py
CHANGED
|
@@ -3,6 +3,13 @@ import numpy as np
|
|
| 3 |
import os
|
| 4 |
from sentence_transformers import SentenceTransformer
|
| 5 |
from transformers import RagTokenizer, RagRetriever, RagSequenceForGeneration
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6 |
|
| 7 |
# 使用更轻量的模型 - 添加 token 参数
|
| 8 |
model_name = "all-MiniLM-L6-v2"
|
|
|
|
| 3 |
import os
|
| 4 |
from sentence_transformers import SentenceTransformer
|
| 5 |
from transformers import RagTokenizer, RagRetriever, RagSequenceForGeneration
|
| 6 |
+
import os
|
| 7 |
+
|
| 8 |
+
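# Configure the PyTorch CUDA caching allocator: do not split blocks larger than 32 MB, to limit fragmentation (this is not a swap setting)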
|
| 9 |
+
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:32"
|
| 10 |
+
|
| 11 |
+
# 设置默认线程数
|
| 12 |
+
torch.set_num_threads(1) # use a single intra-op CPU thread to keep resource usage low
|
| 13 |
|
| 14 |
# 使用更轻量的模型 - 添加 token 参数
|
| 15 |
model_name = "all-MiniLM-L6-v2"
|