vumichien committed on
Commit
c41415e
·
1 Parent(s): c1cf1c2

update GPU config

Browse files
config.py CHANGED
@@ -13,13 +13,25 @@ OUTPUT_DIR = os.path.join(BASE_DIR, "outputs")
13
  SUBJECT_DATA_FILE = os.path.join(DATA_DIR, "subjectData.csv")
14
  SAMPLE_DATA_FILE = os.path.join(DATA_DIR, "sampleData.csv")
15
  STANDARD_NAME_MAP_DATA_FILE = os.path.join(DATA_DIR, "standardData.csv")
16
- # Model Names
17
- MODEL_NAME = "Detomo/cl-nagoya-sup-simcse-ja-nss-v_1_0_6"
18
- SENTENCE_EMBEDDING_FILE = os.path.join(
19
- DATA_DIR,
20
- "anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6.pkl",
21
- )
22
- # SENTENCE_EMBEDDING_FILE = None
23
  MODEL_TYPE = None
24
  DEVICE_TYPE = "cpu"
25
- QINT8 = False
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  SUBJECT_DATA_FILE = os.path.join(DATA_DIR, "subjectData.csv")
14
  SAMPLE_DATA_FILE = os.path.join(DATA_DIR, "sampleData.csv")
15
  STANDARD_NAME_MAP_DATA_FILE = os.path.join(DATA_DIR, "standardData.csv")
16
+
17
+ # Model Config
18
+ HALF = "float16"
 
 
 
 
19
  MODEL_TYPE = None
20
  DEVICE_TYPE = "cpu"
21
+ MODEL_NAME = "Detomo/cl-nagoya-sup-simcse-ja-nss-v_1_0_6"
22
+ if HALF == "float16":
23
+ SENTENCE_EMBEDDING_FILE = os.path.join(
24
+ DATA_DIR,
25
+ "anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_float16.pkl",
26
+ )
27
+ elif HALF == "bfloat16":
28
+ SENTENCE_EMBEDDING_FILE = os.path.join(
29
+ DATA_DIR,
30
+ "anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_bfloat16.pkl",
31
+ )
32
+ else:
33
+ SENTENCE_EMBEDDING_FILE = os.path.join(
34
+ DATA_DIR,
35
+ "anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6.pkl",
36
+ )
37
+ # SENTENCE_EMBEDDING_FILE = None
data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v1_0_2.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:51d2c6c83a577d6afb5701de785405f950a5fcd4c9013ca1dfab53f7d9e5739d
3
- size 18373796
 
 
 
 
data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_3.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:482862ee6138c60ce27604aee19f66ee6d2835cfd08907145d9df65d65829259
3
- size 19547300
 
 
 
 
data/anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_5.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c82797adfac6a639b7566fdd424f876273177e4ebb4a5279889d73e41630b7bd
3
- size 21209252
 
 
 
 
data/{anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v0_9_13_.pkl → anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_bfloat16.pkl} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1209c010eda0150d859ee2b3c9a889ab2bb6f69a65adafbae9ec8f7ffa813962
3
- size 12251300
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:042dcf97e2e686a956e3311e897e1707e330ff1413bf3310cd8ea8b0393abf4c
3
+ size 21888164
data/{anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v0_9_17.pkl → anchor_name_sentence_embeddings_cl-nagoya-sup-simcse-ja-nss-v_1_0_6_float16.pkl} RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae5fab42d01409975e99f20e4907e42e770191ba212c9ccfcc6fe88f6db37ff0
3
- size 16392356
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7eb117306729208293b84057ca01d8fa6238dc5be1f69c3ad452ba84fa6c6bf
3
+ size 10944164
prepare.py CHANGED
@@ -27,13 +27,16 @@ def export_model(backend="onnx", use_qint8=False):
27
  model, "avx512_vnni", MODEL_NAME, push_to_hub=True
28
  )
29
  else:
30
- model.push_to_hub(MODEL_NAME)
31
  else:
32
  raise ValueError(f"Invalid backend: {backend}")
33
 
34
 
35
  # Export all combinations
36
- backend = "openvino"
37
- use_qint8 = False
38
- print(f"Exporting {backend} model with QINT8={use_qint8}")
39
- export_model(backend=backend, use_qint8=use_qint8)
 
 
 
 
27
  model, "avx512_vnni", MODEL_NAME, push_to_hub=True
28
  )
29
  else:
30
+ model.push_to_hub(MODEL_NAME, create_pr=True)
31
  else:
32
  raise ValueError(f"Invalid backend: {backend}")
33
 
34
 
35
  # Export all combinations
36
+ # backend = "onnx"
37
+ # use_qint8 = False
38
+ # print(f"Exporting {backend} model with QINT8={use_qint8}")
39
+ # export_model(backend=backend, use_qint8=use_qint8)
40
+
41
+ # import tensorrt as trt
42
+ # print(trt.__version__)
services/sentence_transformer_service.py CHANGED
@@ -1,8 +1,8 @@
1
  import pickle
2
  from config import (
3
  MODEL_NAME, MODEL_TYPE, DEVICE_TYPE,
4
- SENTENCE_EMBEDDING_FILE,
5
- STANDARD_NAME_MAP_DATA_FILE, SUBJECT_DATA_FILE, DATA_DIR, QINT8
6
  )
7
  from sentence_transformer_lib.sentence_transformer_helper import SentenceTransformerHelper
8
  from data_lib.subject_data import SubjectData
@@ -25,11 +25,11 @@ class SentenceTransformerService:
25
 
26
  print("Loading models and data...")
27
  # Load sentence transformer model
28
- print(f"Loading model {MODEL_NAME} with type {MODEL_TYPE} and qint8={QINT8}")
29
  self.sentenceTransformerHelper = SentenceTransformerHelper(
30
  model_name=MODEL_NAME,
31
  model_type=MODEL_TYPE,
32
- qint8=QINT8
33
  )
34
  # Load standard subject dictionary
35
  self.dic_standard_subject = SubjectData.create_standard_subject_dic_from_file(SUBJECT_DATA_FILE)
 
1
  import pickle
2
  from config import (
3
  MODEL_NAME, MODEL_TYPE, DEVICE_TYPE,
4
+ SENTENCE_EMBEDDING_FILE,
5
+ STANDARD_NAME_MAP_DATA_FILE, SUBJECT_DATA_FILE, DATA_DIR, HALF
6
  )
7
  from sentence_transformer_lib.sentence_transformer_helper import SentenceTransformerHelper
8
  from data_lib.subject_data import SubjectData
 
25
 
26
  print("Loading models and data...")
27
  # Load sentence transformer model
28
+ print(f"Loading model {MODEL_NAME} with type {MODEL_TYPE} and half={HALF}")
29
  self.sentenceTransformerHelper = SentenceTransformerHelper(
30
  model_name=MODEL_NAME,
31
  model_type=MODEL_TYPE,
32
+ half=HALF
33
  )
34
  # Load standard subject dictionary
35
  self.dic_standard_subject = SubjectData.create_standard_subject_dic_from_file(SUBJECT_DATA_FILE)