Spaces:
Runtime error
Runtime error
Commit
·
57a9e1d
1
Parent(s):
0d887dc
first attempt to hf spaces
Browse files- config/config.yaml +3 -0
- requirements.txt +0 -2
- src/demo.py +8 -4
- src/gradio.py +17 -0
config/config.yaml
CHANGED
@@ -20,6 +20,9 @@ debug:
|
|
20 |
is_debug: false
|
21 |
force_rebuild_storage: false
|
22 |
|
|
|
|
|
|
|
23 |
|
24 |
hydra:
|
25 |
verbose: false
|
|
|
20 |
is_debug: false
|
21 |
force_rebuild_storage: false
|
22 |
|
23 |
+
document_parsing:
|
24 |
+
enabled: false
|
25 |
+
|
26 |
|
27 |
hydra:
|
28 |
verbose: false
|
requirements.txt
CHANGED
@@ -35,7 +35,6 @@ cryptography==41.0.2
|
|
35 |
cupy==12.1.0
|
36 |
cycler==0.12.0
|
37 |
cymem==2.0.7
|
38 |
-
dataclasses==0.8
|
39 |
dataclasses-json==0.5.7
|
40 |
datasets==2.14.2
|
41 |
debugpy==1.6.7
|
@@ -43,7 +42,6 @@ decorator==5.1.1
|
|
43 |
defusedxml==0.7.1
|
44 |
dill==0.3.7
|
45 |
effdet==0.4.1
|
46 |
-
en-core-web-trf==3.6.1
|
47 |
entrypoints==0.4
|
48 |
et-xmlfile==1.1.0
|
49 |
exceptiongroup==1.1.2
|
|
|
35 |
cupy==12.1.0
|
36 |
cycler==0.12.0
|
37 |
cymem==2.0.7
|
|
|
38 |
dataclasses-json==0.5.7
|
39 |
datasets==2.14.2
|
40 |
debugpy==1.6.7
|
|
|
42 |
defusedxml==0.7.1
|
43 |
dill==0.3.7
|
44 |
effdet==0.4.1
|
|
|
45 |
entrypoints==0.4
|
46 |
et-xmlfile==1.1.0
|
47 |
exceptiongroup==1.1.2
|
src/demo.py
CHANGED
@@ -55,10 +55,11 @@ class App:
|
|
55 |
def __init__(self, cfg : DictConfig) -> None:
|
56 |
self.cfg = cfg
|
57 |
|
58 |
-
|
59 |
-
|
60 |
-
|
61 |
-
|
|
|
62 |
log.info("Loading: Text Embedding Model")
|
63 |
self.text_embedding_model = hydra.utils.instantiate(cfg.text_embedding)
|
64 |
log.info("Loading: Vector Store")
|
@@ -73,6 +74,9 @@ class App:
|
|
73 |
# if vector store exists, load it
|
74 |
|
75 |
if not Path(self.cfg.storage_path.vector_store).exists() or self.cfg.debug.force_rebuild_storage:
|
|
|
|
|
|
|
76 |
message = (
|
77 |
"Vector store not found at %s. Building storage from scratch"
|
78 |
if not self.cfg.debug.force_rebuild_storage
|
|
|
55 |
def __init__(self, cfg : DictConfig) -> None:
|
56 |
self.cfg = cfg
|
57 |
|
58 |
+
if cfg.document_parsing.enabled:
|
59 |
+
log.info("Loading: Document Loader")
|
60 |
+
self.loader = hydra.utils.instantiate(cfg.document_loader)
|
61 |
+
log.info("Loading: Text Splitter")
|
62 |
+
self.splitter = hydra.utils.instantiate(cfg.text_splitter)
|
63 |
log.info("Loading: Text Embedding Model")
|
64 |
self.text_embedding_model = hydra.utils.instantiate(cfg.text_embedding)
|
65 |
log.info("Loading: Vector Store")
|
|
|
74 |
# if vector store exists, load it
|
75 |
|
76 |
if not Path(self.cfg.storage_path.vector_store).exists() or self.cfg.debug.force_rebuild_storage:
|
77 |
+
if not self.cfg.document_parsing.enabled:
|
78 |
+
raise ValueError("Document parsing is not enabled. Cannot build storage from scratch")
|
79 |
+
|
80 |
message = (
|
81 |
"Vector store not found at %s. Building storage from scratch"
|
82 |
if not self.cfg.debug.force_rebuild_storage
|
src/gradio.py
ADDED
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import gradio as gr
|
2 |
+
from hydra import compose, initialize
|
3 |
+
from omegaconf import OmegaConf
|
4 |
+
|
5 |
+
from demo import App
|
6 |
+
|
7 |
+
def main():
|
8 |
+
with initialize(version_base=None, config_path="../config", job_name="gradio_app"):
|
9 |
+
cfg = compose(config_name="config", overrides=["document_parsing.enabled=False"])
|
10 |
+
|
11 |
+
app = App(cfg)
|
12 |
+
|
13 |
+
webapp = gr.ChatInterface(fn=app.ask_chat, examples=["hello", "hola", "merhaba"], title="LLM4SciLit")
|
14 |
+
webapp.launch(share=True)
|
15 |
+
|
16 |
+
if __name__ == "__main__":
|
17 |
+
main()
|