Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -210,11 +210,14 @@ if fetch_data:
|
|
210 |
st.success("All records are complete!")
|
211 |
|
212 |
st.subheader("Suggested Metadata Enhancements")
|
213 |
-
|
214 |
-
|
215 |
-
|
|
|
216 |
suggestions = []
|
217 |
-
|
|
|
|
|
218 |
if pd.isna(row['subject']) and pd.notna(row['description']):
|
219 |
desc_vec = tfidf.transform([str(row['description'])])
|
220 |
sims = cosine_similarity(desc_vec, tfidf_matrix).flatten()
|
|
|
210 |
st.success("All records are complete!")
|
211 |
|
212 |
st.subheader("Suggested Metadata Enhancements")
|
213 |
+
incomplete_with_desc = incomplete_records[incomplete_records['description'].notnull()]
|
214 |
+
reference_df = metadata_df[metadata_df['subject'].notnull() & metadata_df['description'].notnull()]
|
215 |
+
tfidf = TfidfVectorizer(stop_words='english')
|
216 |
+
try:
|
217 |
suggestions = []
|
218 |
+
tfidf = TfidfVectorizer(stop_words='english')
|
219 |
+
tfidf_matrix = tfidf.fit_transform(reference_df['description'])
|
220 |
+
for idx, row in incomplete_with_desc.iterrows():
|
221 |
if pd.isna(row['subject']) and pd.notna(row['description']):
|
222 |
desc_vec = tfidf.transform([str(row['description'])])
|
223 |
sims = cosine_similarity(desc_vec, tfidf_matrix).flatten()
|