Spaces:

CCockrum
/

LOC-Metadate-Analyzer

Running

App Files Community

CCockrum committed on Apr 25

Commit

1ce0089

verified ·

1 Parent(s): 627b03f

Update app.py

Browse files

Files changed (1) hide show

app.py +27 -14

app.py CHANGED Viewed

@@ -34,20 +34,20 @@ st.markdown("""
             border-radius: 12px;
             margin-bottom: 1rem;
         }
-         .stAlert {
             background-color: #f0f0f5 !important;
-            color: #D3D3D3 !important;
             padding: 1.25rem !important;
             font-size: 1rem !important;
             border-radius: 0.5rem !important;
             box-shadow: 0 2px 5px rgba(0, 0, 0, 0.05) !important;
         }
         header[data-testid="stHeader"] {
-    background-color: gray !important;
 }
         section[data-testid="stSidebar"] > div:first-child {
     background-color: #1A1A1A !important;
-    color: #D3D3D3 !important;
     padding: 2rem 1.5rem 1.5rem 1.5rem !important;
     border-radius: 12px;
     box-shadow: 0 4px 12px rgba(0, 0, 0, 0.08);
@@ -60,16 +60,18 @@ st.markdown("""
     padding-left: 2rem !important;
     padding-right: 2rem !important;
     box-shadow: none !important;
 }
 </style>
 """, unsafe_allow_html=True)
 # Optional: Add a banner image (replace with your image URL)
-st.markdown('<img src="https://cdn-uploads.huggingface.co/production/uploads/67351c643fe51cb1aa28f2e5/7ThcAOjbuM8ajrP85bGs4.jpeg" class="banner">', unsafe_allow_html=True)
 # Streamlit app header
-st.title("LOC MetaDiscovery Agent")
 st.markdown("""
 This tool connects to the LOC API, retrieves metadata from a selected collection, and performs
 an analysis of metadata completeness, suggests enhancements, and identifies authority gaps.
@@ -88,11 +90,22 @@ st.sidebar.markdown("## Settings")
 selected = st.sidebar.selectbox("Select a collection", list(collections.keys()))
 search_query = collections[selected]
-# Use the main search endpoint (most reliable)
-collection_url = f"https://www.loc.gov/search/?q={search_query}&fo=json"
 st.sidebar.write(f"Selected Collection: {selected}")
 st.sidebar.markdown(f"<span style='color: lightgray;'>API URL: {collection_url}</span>", unsafe_allow_html=True)
 # Fetch data from LOC API with spoofed User-Agent header
 headers = {
@@ -155,11 +168,11 @@ def is_valid_date(value):
         return False
 if not metadata_df.empty:
-    st.subheader("Retrieved Metadata Sample")
     st.dataframe(metadata_df.head())
     # Metadata completeness analysis (enhanced)
-    st.subheader("Metadata Completeness Analysis")
     completeness = metadata_df.map(lambda x: not is_incomplete(x)).mean() * 100
     completeness_df = pd.DataFrame({"Field": completeness.index, "Completeness (%)": completeness.values})
     fig = px.bar(completeness_df, x="Field", y="Completeness (%)", title="Metadata Completeness by Field")
@@ -169,19 +182,19 @@ if not metadata_df.empty:
     incomplete_mask = metadata_df.map(is_incomplete).any(axis=1)
     incomplete_records = metadata_df[incomplete_mask]
-    st.subheader("Records with Incomplete Metadata")
     if not incomplete_records.empty:
         st.dataframe(incomplete_records.astype(str))
     else:
         st.success("All metadata fields are complete in this collection!")
-    st.subheader("Identifiers of Items Needing Metadata Updates")
     if not incomplete_records.empty:
         st.write(incomplete_records[['id', 'title']])
     else:
         st.success("All records are complete!")
-    st.subheader("Suggested Metadata Enhancements")
     filled_descriptions = metadata_df[metadata_df['description'].notnull()]['description'].astype(str)
     if len(filled_descriptions) > 1:
         try:

             border-radius: 12px;
             margin-bottom: 1rem;
         }
+                 .stAlert {
             background-color: #f0f0f5 !important;
+            color: #333333 !important;
             padding: 1.25rem !important;
             font-size: 1rem !important;
             border-radius: 0.5rem !important;
             box-shadow: 0 2px 5px rgba(0, 0, 0, 0.05) !important;
         }
         header[data-testid="stHeader"] {
+    background-color: #D3D3D3 !important;
 }
         section[data-testid="stSidebar"] > div:first-child {
     background-color: #1A1A1A !important;
+    color: #FFFFFF !important;
     padding: 2rem 1.5rem 1.5rem 1.5rem !important;
     border-radius: 12px;
     box-shadow: 0 4px 12px rgba(0, 0, 0, 0.08);
     padding-left: 2rem !important;
     padding-right: 2rem !important;
     box-shadow: none !important;
 }
+        html, body, [data-testid="stApp"] {
+            background-color: #FFFFFF !important;
+        }
 </style>
 """, unsafe_allow_html=True)
 # Optional: Add a banner image (replace with your image URL)
+st.image("banner.jpg", use_column_width=True)
 # Streamlit app header
+st.title("MetaDiscovery Agent for Library of Congress Collections")
 st.markdown("""
 This tool connects to the LOC API, retrieves metadata from a selected collection, and performs
 an analysis of metadata completeness, suggests enhancements, and identifies authority gaps.
 selected = st.sidebar.selectbox("Select a collection", list(collections.keys()))
 search_query = collections[selected]
+# About / Help
+with st.sidebar.expander("ℹ️ About This Tool"):
+    st.markdown(
+        "This agent audits and enhances metadata from Library of Congress digital collections. "
+        "Select a collection from the dropdown to begin your analysis."
+    )
+# Display API URL
 st.sidebar.write(f"Selected Collection: {selected}")
 st.sidebar.markdown(f"<span style='color: lightgray;'>API URL: {collection_url}</span>", unsafe_allow_html=True)
+# Summary Stats (conditionally displayed after data load)
+if 'metadata_df' in locals() and not metadata_df.empty:
+    st.sidebar.markdown("### 📊 Quick Stats")
+    st.sidebar.write(f"Total Records: {len(metadata_df)}")
+    st.sidebar.write(f"Incomplete Records: {incomplete_records.shape[0]}")
 # Fetch data from LOC API with spoofed User-Agent header
 headers = {
         return False
 if not metadata_df.empty:
+    st.subheader("📦 Retrieved Metadata Sample")
     st.dataframe(metadata_df.head())
     # Metadata completeness analysis (enhanced)
+    st.subheader("🧠 Metadata Completeness Analysis")
     completeness = metadata_df.map(lambda x: not is_incomplete(x)).mean() * 100
     completeness_df = pd.DataFrame({"Field": completeness.index, "Completeness (%)": completeness.values})
     fig = px.bar(completeness_df, x="Field", y="Completeness (%)", title="Metadata Completeness by Field")
     incomplete_mask = metadata_df.map(is_incomplete).any(axis=1)
     incomplete_records = metadata_df[incomplete_mask]
+    st.subheader("⚠️ Records with Incomplete Metadata")
     if not incomplete_records.empty:
         st.dataframe(incomplete_records.astype(str))
     else:
         st.success("All metadata fields are complete in this collection!")
+    st.subheader("📌 Identifiers of Items Needing Metadata Updates")
     if not incomplete_records.empty:
         st.write(incomplete_records[['id', 'title']])
     else:
         st.success("All records are complete!")
+    st.subheader("✨ Suggested Metadata Enhancements")
     filled_descriptions = metadata_df[metadata_df['description'].notnull()]['description'].astype(str)
     if len(filled_descriptions) > 1:
         try: