GOGO198 committed on
Commit
1b59f0f
·
verified ·
1 Parent(s): 04df201

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -0
app.py CHANGED
@@ -3,6 +3,13 @@ import numpy as np
3
  import os
4
  from sentence_transformers import SentenceTransformer
5
  from transformers import RagTokenizer, RagRetriever, RagSequenceForGeneration
 
 
 
 
 
 
 
6
 
7
  # 使用更轻量的模型 - 添加 token 参数
8
  model_name = "all-MiniLM-L6-v2"
 
3
  import os
4
  from sentence_transformers import SentenceTransformer
5
  from transformers import RagTokenizer, RagRetriever, RagSequenceForGeneration
6
+ import os
7
+
8
+ # 设置内存交换参数
9
+ os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:32"
10
+
11
+ # 设置默认线程数
12
+ torch.set_num_threads(1) # 减少内存占用
13
 
14
  # 使用更轻量的模型 - 添加 token 参数
15
  model_name = "all-MiniLM-L6-v2"