Spaces:

awacke1
/

Freedom-of-Information-Act-FOIA-Datasets

Sleeping

App Files Files Community

awacke1 committed on Mar 19

Commit

42786d7

verified ·

1 Parent(s): 0d8fa25

Update app.py

Browse files

Files changed (1) hide show

app.py +52 -14

app.py CHANGED Viewed

@@ -6,7 +6,6 @@ import os
 import xml.etree.ElementTree as ET
 from typing import Dict, List
-# Function to parse XML and build AGENCIES dictionary
 def load_agencies_from_xml() -> Dict:
     AGENCIES = {}
     xml_files = [f for f in os.listdir('.') if f.endswith('.xml')]
@@ -27,20 +26,19 @@ def load_agencies_from_xml() -> Dict:
                 abbr = org.find("nc:OrganizationAbbreviationText", ns).text
                 fiscal_year = root.find(".//foia:DocumentFiscalYearDate", ns).text if root.find(".//foia:DocumentFiscalYearDate", ns) is not None else "N/A"
-                # Build minimal agency data (can be expanded with more XML data)
                 AGENCIES[name] = {
                     "name": name,
                     "summary": {
                         "name": name,
                         "description": f"FOIA data for {name} ({fiscal_year})",
                         "abbreviation": abbr,
-                        "website": f"https://www.{abbr.lower()}.gov"  # Guessed URL, adjust as needed
                     },
                     "website": f"https://www.{abbr.lower()}.gov",
-                    "emails": [f"foia@{abbr.lower()}.gov"],  # Guessed email
-                    "address": {"address_lines": [], "street": "", "city": "", "state": "", "zip": ""},  # Placeholder
-                    "service_center": {"phone": ["N/A"]},  # Placeholder
-                    "request_form": f"https://www.{abbr.lower()}.gov/foia",  # Guessed form URL
                     "request_time_stats": {
                         fiscal_year: {
                             "simple_median_days": float(root.find(".//foia:ProcessedResponseTimeSection/foia:ProcessedResponseTime/foia:SimpleResponseTime/foia:ResponseTimeMedianDaysValue", ns).text) if root.find(".//foia:ProcessedResponseTimeSection/foia:ProcessedResponseTime/foia:SimpleResponseTime/foia:ResponseTimeMedianDaysValue", ns) is not None else 0
@@ -93,12 +91,36 @@ class Agency:
     def hasRequestForm(self) -> bool:
         """Report whether this agency has a non-empty ``request_form`` value."""
         form = self.request_form
         # Any falsy value (None, empty string, ...) counts as "no form".
         return True if form else False
 def create_search_url_wikipedia(search_query):
     """Build a Wikipedia search-redirect URL for ``search_query``.

     The query is appended to the ``search=`` parameter of Wikipedia's
     search-redirect endpoint. ``&`` is spelled out as ``and`` and every
     other reserved or non-ASCII character is percent-encoded (spaces
     become ``+``), so the result is always a single well-formed URL. This
     matters to callers that embed the URL in a Markdown link: an
     unencoded ``)`` or ``#`` would otherwise cut the link short.

     Args:
         search_query: Free-text search phrase, e.g. a dataset title.

     Returns:
         The full search URL as a string.
     """
     # Local import keeps this function self-contained.
     from urllib.parse import quote_plus

     base_url = "https://www.wikipedia.org/search-redirect.php?family=wikipedia&language=en&search="
     # Replace '&' with the word "and" first so it is not encoded as %26.
     readable_query = search_query.replace('&', 'and')
     # quote_plus maps ' ' -> '+' and the en dash -> '%E2%80%93', and also
     # escapes everything else that is unsafe inside a query string.
     return base_url + quote_plus(readable_query)
 def parse_foia_xml(filename: str) -> Dict:
-    """Parse FOIA XML file and return key information"""
     try:
         tree = ET.parse(filename)
         root = tree.getroot()
@@ -131,9 +153,18 @@ def list_and_display_xml_files():
         return
     for xml_file in xml_files:
-        file_name = xml_file[:-4]  # Remove .xml extension
         data = parse_foia_xml(xml_file)
         with st.expander(f"📋 {file_name} - {data['name']} ({data['abbr']})"):
             st.write(f"📅 Fiscal Year: {data['fiscal_year']}")
             st.write(f"⏳ Pending at Start: {data['pending_start']}")
             st.write(f"📥 Received: {data['received']}")
@@ -154,11 +185,16 @@ def search_foia_content(query: str, agency: str = None) -> Dict:
     return results
 def main():
-    # Load agencies from XML files
     AGENCIES = load_agencies_from_xml()
     st.title("Freedom of Information Act (FOIA) Explorer 🌍📊")
     st.write("""
     The Freedom of Information Act (FOIA) empowers individuals by granting access to previously unreleased information and documents controlled by the United States government. Championing transparency and accountability, FOIA serves as a foundation for democratic engagement and open government initiatives. 🎉✨
     Below is a list of datasets available under FOIA, alongside guessed Wikipedia URLs for more information. 📚🔍
@@ -169,7 +205,6 @@ def main():
     - [Data.Gov](https://catalog.data.gov/dataset?tags=foia)
     """)
-    # FOIA Datasets with Emojis
     datasets = [
         ("Provider Taxonomy", "🩺"),
         ("Consumer Complaint Database", "📞"),
@@ -185,7 +220,6 @@ def main():
     for dataset, emoji in datasets:
         st.markdown(f"- {emoji} **{dataset}**: [Wikipedia]({create_search_url_wikipedia(dataset)})")
-    # Agency Browser
     st.header("Agency Browser")
     agency_names = sorted(list(AGENCIES.keys()))
     selected_agency = st.selectbox("Select Agency", [""] + agency_names)
@@ -193,6 +227,12 @@ def main():
     if selected_agency:
         agency = Agency(AGENCIES[selected_agency])
         st.subheader(f"{agency.name} Details")
         st.write(f"Description: {agency.summary.get('description', 'N/A')}")
         st.write(f"Abbreviation: {agency.summary.get('abbreviation', 'N/A')}")
         if agency.website:
@@ -224,7 +264,6 @@ def main():
                         if "median" in key:
                             st.write(f"{key.replace('_median_days', '').title()}: {value} days")
-    # FOIA Document Search
     st.subheader("Search FOIA Documents")
     search_query = st.text_input("Enter search query")
     if st.button("Search") and search_query:
@@ -234,7 +273,6 @@ def main():
             for result in results["results"]:
                 st.write(f"- {result['title']} ({result['date']})")
-    # XML Files Display
     st.header("FOIA XML Reports")
     list_and_display_xml_files()

 import xml.etree.ElementTree as ET
 from typing import Dict, List
 def load_agencies_from_xml() -> Dict:
     AGENCIES = {}
     xml_files = [f for f in os.listdir('.') if f.endswith('.xml')]
                 abbr = org.find("nc:OrganizationAbbreviationText", ns).text
                 fiscal_year = root.find(".//foia:DocumentFiscalYearDate", ns).text if root.find(".//foia:DocumentFiscalYearDate", ns) is not None else "N/A"
                 AGENCIES[name] = {
                     "name": name,
                     "summary": {
                         "name": name,
                         "description": f"FOIA data for {name} ({fiscal_year})",
                         "abbreviation": abbr,
+                        "website": f"https://www.{abbr.lower()}.gov"
                     },
                     "website": f"https://www.{abbr.lower()}.gov",
+                    "emails": [f"foia@{abbr.lower()}.gov"],
+                    "address": {"address_lines": [], "street": "", "city": "", "state": "", "zip": ""},
+                    "service_center": {"phone": ["N/A"]},
+                    "request_form": f"https://www.{abbr.lower()}.gov/foia",
                     "request_time_stats": {
                         fiscal_year: {
                             "simple_median_days": float(root.find(".//foia:ProcessedResponseTimeSection/foia:ProcessedResponseTime/foia:SimpleResponseTime/foia:ResponseTimeMedianDaysValue", ns).text) if root.find(".//foia:ProcessedResponseTimeSection/foia:ProcessedResponseTime/foia:SimpleResponseTime/foia:ResponseTimeMedianDaysValue", ns) is not None else 0
     def hasRequestForm(self) -> bool:
         """Report whether this agency has a non-empty ``request_form`` value."""
         form = self.request_form
         # Any falsy value (None, empty string, ...) counts as "no form".
         return True if form else False
+AGENCY_LOGOS = {
+    "CFA": "https://upload.wikimedia.org/wikipedia/en/e/e8/U.S._Commission_of_Fine_Arts_logo.png",
+    "CEQ": "https://upload.wikimedia.org/wikipedia/commons/5/58/CEQ-Seal.png",
+    "DOJ": "https://upload.wikimedia.org/wikipedia/commons/f/f8/Seal_of_the_United_States_Department_of_Justice.svg",
+    "EPA": "https://upload.wikimedia.org/wikipedia/commons/7/78/Environmental_Protection_Agency_logo.svg",
+    "FTC": "https://upload.wikimedia.org/wikipedia/commons/5/5b/US-FederalTradeCommission-Seal.svg",
+    "ABMC": "https://upload.wikimedia.org/wikipedia/commons/2/2f/ABMC_seal.png",
+    "AFRH": "https://upload.wikimedia.org/wikipedia/commons/2/2e/Armed_Forces_Retirement_Home_logo.png",
+    "DHS": "https://upload.wikimedia.org/wikipedia/commons/5/52/Seal_of_the_United_States_Department_of_Homeland_Security.svg",
+    "DOC": "https://upload.wikimedia.org/wikipedia/commons/e/e0/Seal_of_the_United_States_Department_of_Commerce.svg",
+    "DOD": "https://upload.wikimedia.org/wikipedia/commons/e/e0/Seal_of_the_United_States_Department_of_Defense_%282004%29.svg",
+    "DOE": "https://upload.wikimedia.org/wikipedia/commons/e/e0/United_States_Department_of_Energy_Seal.svg",
+    "DOI": "https://upload.wikimedia.org/wikipedia/commons/e/e3/Seal_of_the_United_States_Department_of_the_Interior.svg",
+    "DOL": "https://upload.wikimedia.org/wikipedia/commons/4/47/Seal_of_the_United_States_Department_of_Labor.svg",
+    "DOS": "https://upload.wikimedia.org/wikipedia/commons/1/1b/Seal_of_the_United_States_Department_of_State.svg",
+    "DOT": "https://upload.wikimedia.org/wikipedia/commons/8/88/Seal_of_the_United_States_Department_of_Transportation.svg",
+    "HHS": "https://upload.wikimedia.org/wikipedia/commons/0/03/Seal_of_the_U.S._Department_of_Health_and_Human_Services.svg",
+    "HUD": "https://upload.wikimedia.org/wikipedia/commons/6/6e/Seal_of_the_United_States_Department_of_Housing_and_Urban_Development.svg",
+    "NASA": "https://upload.wikimedia.org/wikipedia/commons/e/e5/NASA_logo.svg",
+    "NRC": "https://upload.wikimedia.org/wikipedia/commons/8/85/U.S._Nuclear_Regulatory_Commission_seal.svg",
+    "SSA": "https://upload.wikimedia.org/wikipedia/commons/6/6e/Social_Security_Administration_logo_%282019%29.svg",
+    "USDA": "https://upload.wikimedia.org/wikipedia/commons/0/0f/Seal_of_the_United_States_Department_of_Agriculture.svg",
+    "VA": "https://upload.wikimedia.org/wikipedia/commons/8/87/Seal_of_the_U.S._Department_of_Veterans_Affairs.svg",
+}
 def create_search_url_wikipedia(search_query):
     """Build a Wikipedia search-redirect URL for ``search_query``.

     The query is appended to the ``search=`` parameter of Wikipedia's
     search-redirect endpoint. ``&`` is spelled out as ``and`` and every
     other reserved or non-ASCII character is percent-encoded (spaces
     become ``+``), so the result is always a single well-formed URL. This
     matters to callers that embed the URL in a Markdown link: an
     unencoded ``)`` or ``#`` would otherwise cut the link short.

     Args:
         search_query: Free-text search phrase, e.g. a dataset title.

     Returns:
         The full search URL as a string.
     """
     # Local import keeps this function self-contained.
     from urllib.parse import quote_plus

     base_url = "https://www.wikipedia.org/search-redirect.php?family=wikipedia&language=en&search="
     # Replace '&' with the word "and" first so it is not encoded as %26.
     readable_query = search_query.replace('&', 'and')
     # quote_plus maps ' ' -> '+' and the en dash -> '%E2%80%93', and also
     # escapes everything else that is unsafe inside a query string.
     return base_url + quote_plus(readable_query)
 def parse_foia_xml(filename: str) -> Dict:
     try:
         tree = ET.parse(filename)
         root = tree.getroot()
         return
     for xml_file in xml_files:
+        file_name = xml_file[:-4]
         data = parse_foia_xml(xml_file)
         with st.expander(f"📋 {file_name} - {data['name']} ({data['abbr']})"):
+            if data['abbr'] in AGENCY_LOGOS:
+                st.image(
+                    AGENCY_LOGOS[data['abbr']],
+                    caption=f"{data['name']} Seal",
+                    width=100
+                )
+            else:
+                st.write("🖼️ No logo available for this agency yet.")
             st.write(f"📅 Fiscal Year: {data['fiscal_year']}")
             st.write(f"⏳ Pending at Start: {data['pending_start']}")
             st.write(f"📥 Received: {data['received']}")
     return results
 def main():
     AGENCIES = load_agencies_from_xml()
     st.title("Freedom of Information Act (FOIA) Explorer 🌍📊")
+    st.image(
+        "https://upload.wikimedia.org/wikipedia/en/e/e8/U.S._Commission_of_Fine_Arts_logo.png",
+        caption="Logo of the United States Commission of Fine Arts - Representing U.S. Government Transparency",
+        width=200
+    )
     st.write("""
     The Freedom of Information Act (FOIA) empowers individuals by granting access to previously unreleased information and documents controlled by the United States government. Championing transparency and accountability, FOIA serves as a foundation for democratic engagement and open government initiatives. 🎉✨
     Below is a list of datasets available under FOIA, alongside guessed Wikipedia URLs for more information. 📚🔍
     - [Data.Gov](https://catalog.data.gov/dataset?tags=foia)
     """)
     datasets = [
         ("Provider Taxonomy", "🩺"),
         ("Consumer Complaint Database", "📞"),
     for dataset, emoji in datasets:
         st.markdown(f"- {emoji} **{dataset}**: [Wikipedia]({create_search_url_wikipedia(dataset)})")
     st.header("Agency Browser")
     agency_names = sorted(list(AGENCIES.keys()))
     selected_agency = st.selectbox("Select Agency", [""] + agency_names)
     if selected_agency:
         agency = Agency(AGENCIES[selected_agency])
         st.subheader(f"{agency.name} Details")
+        if agency.summary.get('abbreviation') in AGENCY_LOGOS:
+            st.image(
+                AGENCY_LOGOS[agency.summary.get('abbreviation')],
+                caption=f"{agency.name} Seal",
+                width=100
+            )
         st.write(f"Description: {agency.summary.get('description', 'N/A')}")
         st.write(f"Abbreviation: {agency.summary.get('abbreviation', 'N/A')}")
         if agency.website:
                         if "median" in key:
                             st.write(f"{key.replace('_median_days', '').title()}: {value} days")
     st.subheader("Search FOIA Documents")
     search_query = st.text_input("Enter search query")
     if st.button("Search") and search_query:
             for result in results["results"]:
                 st.write(f"- {result['title']} ({result['date']})")
     st.header("FOIA XML Reports")
     list_and_display_xml_files()