Spaces:
Sleeping
Sleeping
update GPU config
Browse files
- config.py +20 -8
- data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v1_0_2.pkl +0 -3
- data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_3.pkl +0 -3
- data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_5.pkl +0 -3
- data/{anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v0_9_13_.pkl → anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_bfloat16.pkl} +2 -2
- data/{anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v0_9_17.pkl → anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_float16.pkl} +2 -2
- prepare.py +8 -5
- services/sentence_transformer_service.py +4 -4
config.py
CHANGED
@@ -13,13 +13,25 @@ OUTPUT_DIR = os.path.join(BASE_DIR, "outputs")
|
|
13 |
SUBJECT_DATA_FILE = os.path.join(DATA_DIR, "subjectData.csv")
|
14 |
SAMPLE_DATA_FILE = os.path.join(DATA_DIR, "sampleData.csv")
|
15 |
STANDARD_NAME_MAP_DATA_FILE = os.path.join(DATA_DIR, "standardData.csv")
|
16 |
-
|
17 |
-
|
18 |
-
|
19 |
-
DATA_DIR,
|
20 |
-
"anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6.pkl",
|
21 |
-
)
|
22 |
-
# SENTENCE_EMBEDDING_FILE = None
|
23 |
MODEL_TYPE = None
|
24 |
DEVICE_TYPE = "cpu"
|
25 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
13 |
SUBJECT_DATA_FILE = os.path.join(DATA_DIR, "subjectData.csv")
|
14 |
SAMPLE_DATA_FILE = os.path.join(DATA_DIR, "sampleData.csv")
|
15 |
STANDARD_NAME_MAP_DATA_FILE = os.path.join(DATA_DIR, "standardData.csv")
|
16 |
+
|
17 |
+
# Model Config
|
18 |
+
HALF = "float16"
|
|
|
|
|
|
|
|
|
19 |
MODEL_TYPE = None
|
20 |
DEVICE_TYPE = "cpu"
|
21 |
+
MODEL_NAME = "Detomo/cl-nagoya-sup-simcse-ja-nss-v_1_0_6"
|
22 |
+
if HALF == "float16":
|
23 |
+
SENTENCE_EMBEDDING_FILE = os.path.join(
|
24 |
+
DATA_DIR,
|
25 |
+
"anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_float16.pkl",
|
26 |
+
)
|
27 |
+
elif HALF == "bfloat16":
|
28 |
+
SENTENCE_EMBEDDING_FILE = os.path.join(
|
29 |
+
DATA_DIR,
|
30 |
+
"anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_bfloat16.pkl",
|
31 |
+
)
|
32 |
+
else:
|
33 |
+
SENTENCE_EMBEDDING_FILE = os.path.join(
|
34 |
+
DATA_DIR,
|
35 |
+
"anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6.pkl",
|
36 |
+
)
|
37 |
+
# SENTENCE_EMBEDDING_FILE = None
|
data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v1_0_2.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:51d2c6c83a577d6afb5701de785405f950a5fcd4c9013ca1dfab53f7d9e5739d
|
3 |
-
size 18373796
|
|
|
|
|
|
|
|
data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_3.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:482862ee6138c60ce27604aee19f66ee6d2835cfd08907145d9df65d65829259
|
3 |
-
size 19547300
|
|
|
|
|
|
|
|
data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_5.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:c82797adfac6a639b7566fdd424f876273177e4ebb4a5279889d73e41630b7bd
|
3 |
-
size 21209252
|
|
|
|
|
|
|
|
data/{anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v0_9_13_.pkl → anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_bfloat16.pkl}
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:042dcf97e2e686a956e3311e897e1707e330ff1413bf3310cd8ea8b0393abf4c
|
3 |
+
size 21888164
|
data/{anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v0_9_17.pkl → anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_float16.pkl}
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7eb117306729208293b84057ca01d8fa6238dc5be1f69c3ad452ba84fa6c6bf
|
3 |
+
size 10944164
|
prepare.py
CHANGED
@@ -27,13 +27,16 @@ def export_model(backend="onnx", use_qint8=False):
|
|
27 |
model, "avx512_vnni", MODEL_NAME, push_to_hub=True
|
28 |
)
|
29 |
else:
|
30 |
-
model.push_to_hub(MODEL_NAME)
|
31 |
else:
|
32 |
raise ValueError(f"Invalid backend: {backend}")
|
33 |
|
34 |
|
35 |
# Export all combinations
|
36 |
-
backend = "
|
37 |
-
use_qint8 = False
|
38 |
-
print(f"Exporting {backend} model with QINT8={use_qint8}")
|
39 |
-
export_model(backend=backend, use_qint8=use_qint8)
|
|
|
|
|
|
|
|
27 |
model, "avx512_vnni", MODEL_NAME, push_to_hub=True
|
28 |
)
|
29 |
else:
|
30 |
+
model.push_to_hub(MODEL_NAME, create_pr=True)
|
31 |
else:
|
32 |
raise ValueError(f"Invalid backend: {backend}")
|
33 |
|
34 |
|
35 |
# Export all combinations
|
36 |
+
# backend = "onnx"
|
37 |
+
# use_qint8 = False
|
38 |
+
# print(f"Exporting {backend} model with QINT8={use_qint8}")
|
39 |
+
# export_model(backend=backend, use_qint8=use_qint8)
|
40 |
+
|
41 |
+
# import tensorrt as trt
|
42 |
+
# print(trt.__version__)
|
services/sentence_transformer_service.py
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
import pickle
|
2 |
from config import (
|
3 |
MODEL_NAME, MODEL_TYPE, DEVICE_TYPE,
|
4 |
-
SENTENCE_EMBEDDING_FILE,
|
5 |
-
STANDARD_NAME_MAP_DATA_FILE, SUBJECT_DATA_FILE, DATA_DIR,
|
6 |
)
|
7 |
from sentence_transformer_lib.sentence_transformer_helper import SentenceTransformerHelper
|
8 |
from data_lib.subject_data import SubjectData
|
@@ -25,11 +25,11 @@ class SentenceTransformerService:
|
|
25 |
|
26 |
print("Loading models and data...")
|
27 |
# Load sentence transformer model
|
28 |
-
print(f"Loading model {MODEL_NAME} with type {MODEL_TYPE} and
|
29 |
self.sentenceTransformerHelper = SentenceTransformerHelper(
|
30 |
model_name=MODEL_NAME,
|
31 |
model_type=MODEL_TYPE,
|
32 |
-
|
33 |
)
|
34 |
# Load standard subject dictionary
|
35 |
self.dic_standard_subject = SubjectData.create_standard_subject_dic_from_file(SUBJECT_DATA_FILE)
|
|
|
1 |
import pickle
|
2 |
from config import (
|
3 |
MODEL_NAME, MODEL_TYPE, DEVICE_TYPE,
|
4 |
+
SENTENCE_EMBEDDING_FILE,
|
5 |
+
STANDARD_NAME_MAP_DATA_FILE, SUBJECT_DATA_FILE, DATA_DIR, HALF
|
6 |
)
|
7 |
from sentence_transformer_lib.sentence_transformer_helper import SentenceTransformerHelper
|
8 |
from data_lib.subject_data import SubjectData
|
|
|
25 |
|
26 |
print("Loading models and data...")
|
27 |
# Load sentence transformer model
|
28 |
+
print(f"Loading model {MODEL_NAME} with type {MODEL_TYPE} and half={HALF}")
|
29 |
self.sentenceTransformerHelper = SentenceTransformerHelper(
|
30 |
model_name=MODEL_NAME,
|
31 |
model_type=MODEL_TYPE,
|
32 |
+
half=HALF
|
33 |
)
|
34 |
# Load standard subject dictionary
|
35 |
self.dic_standard_subject = SubjectData.create_standard_subject_dic_from_file(SUBJECT_DATA_FILE)
|