Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -8,7 +8,7 @@ embedding_path = "abokbot/wikipedia-embedding"
|
|
8 |
|
9 |
st.header("Wikipedia Search Engine app")
|
10 |
|
11 |
-
st_model_load = st.text('Loading
|
12 |
|
13 |
@st.cache_resource
|
14 |
def load_embedding():
|
@@ -41,7 +41,7 @@ def load_wikipedia_dataset():
|
|
41 |
return dataset
|
42 |
|
43 |
dataset = load_wikipedia_dataset()
|
44 |
-
st.success('
|
45 |
st_model_load.text("")
|
46 |
|
47 |
if 'text' not in st.session_state:
|
@@ -82,14 +82,17 @@ def search():
|
|
82 |
print("\n-------------------------\n")
|
83 |
print("Top-3 Cross-Encoder Re-ranker hits")
|
84 |
st.subheader("Top-3 Search results")
|
85 |
-
results
|
86 |
-
for
|
87 |
-
results
|
88 |
-
|
89 |
-
|
90 |
-
|
91 |
-
|
92 |
-
|
|
|
|
|
|
|
93 |
st.session_state.results = results
|
94 |
|
95 |
|
@@ -102,7 +105,7 @@ print(st.session_state.results)
|
|
102 |
if len(st.session_state.results) > 0:
|
103 |
with st.container():
|
104 |
st.subheader("Search results")
|
105 |
-
for
|
106 |
st.markdown("score: " + result["score"])
|
107 |
st.markdown("title: " + result["title"])
|
108 |
st.markdown("abstract: " + result["abstract"])
|
|
|
8 |
|
9 |
st.header("Wikipedia Search Engine app")
|
10 |
|
11 |
+
st_model_load = st.text('Loading embeddings, encoders and dataset (takes about 5min)')
|
12 |
|
13 |
@st.cache_resource
|
14 |
def load_embedding():
|
|
|
41 |
return dataset
|
42 |
|
43 |
dataset = load_wikipedia_dataset()
|
44 |
+
st.success('App ready')
|
45 |
st_model_load.text("")
|
46 |
|
47 |
if 'text' not in st.session_state:
|
|
|
82 |
print("\n-------------------------\n")
|
83 |
print("Top-3 Cross-Encoder Re-ranker hits")
|
84 |
st.subheader("Top-3 Search results")
|
85 |
+
results = []
|
86 |
+
for hit in hits[:3]:
|
87 |
+
results.append
|
88 |
+
(
|
89 |
+
{
|
90 |
+
"score": round(hit['cross-score'], 3),
|
91 |
+
"title": dataset[hit['corpus_id']]["title"],
|
92 |
+
"abstract": dataset[hit['corpus_id']]["text"].replace("\n", " "),
|
93 |
+
"link": dataset[hit['corpus_id']]["url"]
|
94 |
+
}
|
95 |
+
)
|
96 |
st.session_state.results = results
|
97 |
|
98 |
|
|
|
105 |
if len(st.session_state.results) > 0:
|
106 |
with st.container():
|
107 |
st.subheader("Search results")
|
108 |
+
for result in st.session_state.results:
|
109 |
st.markdown("score: " + result["score"])
|
110 |
st.markdown("title: " + result["title"])
|
111 |
st.markdown("abstract: " + result["abstract"])
|