Spaces:
Running
Running
henok3878
committed on
Commit
·
44bb151
1
Parent(s):
56ecf7d
feature: add quantized model for cpu inference
Browse files
- main.py +4 -0
- packaged_models/model.scripted.quantized.pt +2 -2
main.py
CHANGED
@@ -9,11 +9,13 @@ import logging
|
|
9 |
import time
|
10 |
from contextlib import asynccontextmanager
|
11 |
from inference_utils import construct_alphabet_list, convert_offsets_to_absolute_coords, encode_text, get_alphabet_map
|
|
|
12 |
|
13 |
logging.basicConfig(level=logging.INFO)
|
14 |
logger = logging.getLogger(__name__)
|
15 |
|
16 |
MODEL_DIR = Path("./packaged_models")
|
|
|
17 |
SCRIPTED_MODEL_NAME = "model.scripted.pt"
|
18 |
METADATA_MODEL_NAME = "model.pt"
|
19 |
|
@@ -62,6 +64,8 @@ async def lifespan(app: FastAPI):
|
|
62 |
|
63 |
scripted_model_path = MODEL_DIR / SCRIPTED_MODEL_NAME
|
64 |
metadata_model_path = MODEL_DIR / METADATA_MODEL_NAME
|
|
|
|
|
65 |
|
66 |
if not scripted_model_path.exists():
|
67 |
logger.error(f"Traced model not found at {scripted_model_path}")
|
|
|
9 |
import time
|
10 |
from contextlib import asynccontextmanager
|
11 |
from inference_utils import construct_alphabet_list, convert_offsets_to_absolute_coords, encode_text, get_alphabet_map
|
12 |
+
from ml.src.inference_benchmark import QUANTIZED_MODEL_NAME
|
13 |
|
14 |
logging.basicConfig(level=logging.INFO)
|
15 |
logger = logging.getLogger(__name__)
|
16 |
|
17 |
MODEL_DIR = Path("./packaged_models")
|
18 |
+
QUANTIZED_MODEL_NAME = "model.scripted.quantized.pt"
|
19 |
SCRIPTED_MODEL_NAME = "model.scripted.pt"
|
20 |
METADATA_MODEL_NAME = "model.pt"
|
21 |
|
|
|
64 |
|
65 |
scripted_model_path = MODEL_DIR / SCRIPTED_MODEL_NAME
|
66 |
metadata_model_path = MODEL_DIR / METADATA_MODEL_NAME
|
67 |
+
if device.type == "cpu":
|
68 |
+
scripted_model_path = MODEL_DIR / QUANTIZED_MODEL_NAME
|
69 |
|
70 |
if not scripted_model_path.exists():
|
71 |
logger.error(f"Traced model not found at {scripted_model_path}")
|
packaged_models/model.scripted.quantized.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c88342d00b8eb7d0380da89d9cf9f9744a9e6a7caac2f783f6b912d58c3129ac
|
3 |
+
size 4509816
|