Update app.py
Browse files
app.py
CHANGED
@@ -12,8 +12,9 @@ CACHE_DIR = "/home/user/cache"
|
|
12 |
os.makedirs(CACHE_DIR, exist_ok=True)
|
13 |
|
14 |
# 减少内存占用
|
15 |
-
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:32"
|
16 |
-
torch.set_num_threads(1)
|
|
|
17 |
|
18 |
# 全局变量 - 移除了clip_model和clip_processor
|
19 |
index = None
|
@@ -71,6 +72,8 @@ def load_resources():
|
|
71 |
print(f"❌ 元数据加载失败: {str(e)}")
|
72 |
raise
|
73 |
|
|
|
|
|
74 |
def predict(vector):
|
75 |
"""处理768维向量输入并返回答案"""
|
76 |
print(f"输入向量维度: {np.array(vector).shape}")
|
|
|
12 |
os.makedirs(CACHE_DIR, exist_ok=True)
|
13 |
|
14 |
# 减少内存占用
|
15 |
+
# os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "max_split_size_mb:32"
|
16 |
+
# torch.set_num_threads(1)
|
17 |
+
os.environ["OMP_NUM_THREADS"] = "8"
|
18 |
|
19 |
# 全局变量 - 移除了clip_model和clip_processor
|
20 |
index = None
|
|
|
72 |
print(f"❌ 元数据加载失败: {str(e)}")
|
73 |
raise
|
74 |
|
75 |
+
from functools import lru_cache
|
76 |
+
@lru_cache(maxsize=1000)
|
77 |
def predict(vector):
|
78 |
"""处理768维向量输入并返回答案"""
|
79 |
print(f"输入向量维度: {np.array(vector).shape}")
|