Spaces:

Rooobert
/

114-Learning-Project-APP

Sleeping

App Files Files Community

Rooobert committed on Mar 5

Commit

933be95

verified ·

1 Parent(s): 278bb6a

Update app.py

Browse files

Files changed (1) hide show

app.py +132 -208

app.py CHANGED Viewed

@@ -1,114 +1,4 @@
-def main():
-    # 設置頁面配置
-    st.set_page_config(
-        page_title="114年度樂齡學習數位示範體驗場域 服務滿意度調查分析報告",
-        page_icon="📊",
-        layout="wide"
-    )
-    # 添加標題和子標題
-    st.markdown("""
-    # 114年度樂齡學習數位示範體驗場域 服務滿意度調查分析報告
-    ## 全面理解樂齡學習者數位服務體驗
-    本報告提供全面的問卷調查分析與視覺化圖表，深入剖析樂齡學習者參與數位示範場域服務的滿意情形。
-    透過詳細的統計分析和互動式圖表，我們旨在呈現樂齡學習者的服務體驗和需求洞察。
-    ### 報告製作單位
-    **國立中正大學高齡教育研究中心專案管理團隊**
-    """)
-    # 分隔線
-    st.markdown("---")
-    # 上傳 CSV 檔案
-    uploaded_file = st.file_uploader("上傳 CSV 檔案", type=['csv'])
-    # 預設數據按鈕
-    use_default_data = st.button('使用預設範例數據')
-    # 數據載入和處理
-    df = None
-    analyzer = None
-    if uploaded_file is not None:
-        # 讀取上傳的 CSV 檔案
-        try:
-            df = pd.read_csv(uploaded_file, encoding='utf-8')
-            st.success("CSV 檔案上傳成功！")
-        except Exception as e:
-            st.error(f"無法讀取檔案：{e}")
-            return
-    elif use_default_data:
-        # 使用預設數據
-        df = read_google_sheet(sheet_id, gid)
-        if df is None:
-            st.error("無法讀取預設數據，請上傳 CSV 檔案")
-            return
-    # 如果有數據，則進行分析
-    if df is not None:
-        analyzer = SurveyAnalyzer()
-        # 新增場域和月份篩選器
-        st.sidebar.header("🔍 數據篩選")
-        # 假設數據有「場域名稱」欄位，如果名稱不同請調整
-        if '場域名稱' in df.columns:
-            venues = ['全部'] + sorted(df['場域名稱'].unique().tolist())
-            selected_venues = st.sidebar.multiselect("選擇場域", venues, default=['全部'])
-        else:
-            # 如果沒有場域欄位，創建10個虛擬場域供選擇
-            venues = ['全部'] + [f'場域{i+1}' for i in range(10)]
-            selected_venues = st.sidebar.multiselect("選擇場域", venues, default=['全部'])
-        # 假設數據有「月份」欄位，如果沒有請調整
-        if '月份' in df.columns:
-            months = ['全部'] + sorted(df['月份'].unique().tolist())
-            selected_month = st.sidebar.selectbox("選擇月份", months)
-        else:
-            # 如果沒有月份欄位，可以創建虛擬月份選項
-            months = ['全部'] + [f'{i+1}月' for i in range(12)]
-            selected_month = st.sidebar.selectbox("選擇月份", months)
-        # 📌 基本統計數據
-        st.sidebar.header("📌 選擇數據分析")
-        selected_analysis = st.sidebar.radio("選擇要查看的分析",
-                                             ["📋 問卷統計報告", "📊 滿意度統計", "🟠 性別分佈"])
-        if selected_analysis == "📋 問卷統計報告":
-            st.header("📋 問卷統計報告")
-            report = analyzer.generate_report(df)
-            for category, stats in report.items():
-                with st.expander(f"🔍 {category}", expanded=True):
-                    for key, value in stats.items():
-                        if key == '各項滿意度':
-                            st.write(f"**{key}:**")
-                            for item, item_stats in value.items():
-                                st.write(f"  - **{item}**: {', '.join([f'{k}: {v}' for k, v in item_stats.items()])}")
-                        else:
-                            st.write(f"**{key}**: {value}")
-        elif selected_analysis == "📊 滿意度統計":
-            st.header("📊 滿意度統計")
-            analyzer.plot_satisfaction_scores(df)
-        elif selected_analysis == "🟠 性別分佈":
-            st.header("🟠 性別分佈")
-            analyzer.plot_gender_distribution(df, selected_venues, selected_month)
-        # 報告說明
-        st.markdown("---")
-        st.markdown("""
-        ### 報告說明
-        - **數據來源**：114年度樂齡學習數位示範體驗場域調查問卷
-        - **分析目的**：評估樂齡學習者對數位示範場域服務的滿意度
-        - **報告解讀**：本報告提供服務滿意度的客觀量化指標，旨在協助改進服務品質
-        """)
-    else:
-        st.info("請上傳 CSV 檔案或使用預設範例數據")import streamlit as st
 import pandas as pd
 import plotly.express as px
 import numpy as np
@@ -143,25 +33,50 @@ class SurveyMappings:
 class SurveyAnalyzer:
     """📊 問卷分析類"""
-    def __init__(self):
         self.mappings = SurveyMappings()
-        self.satisfaction_columns = [
-            '１． 示範場域提供多元的數位課程與活動',
-            '２．示範場域的數位課程與活動對我的生活應用有幫助',
-            '３： 示範場域的服務人員親切有禮貌',
-            '４．示範場域的服務空間與數位設備友善方便',
-            '５．在示範場域可以獲得需要的協助',
-            '６．對於示範場域的服務感到滿意'
-        ]
-        self.satisfaction_short_names = [
-            '多元課程與活動',
-            '生活應用有幫助',
-            '服務人員親切',
-            '空間設備友善',
-            '獲得需要協助',
-            '整體服務滿意'
         ]
     def calculate_age(self, birth_year_column):
         """🔢 計算年齡（從民國年到實際年齡）"""
         # 獲取當前年份（西元年）
@@ -181,14 +96,48 @@ class SurveyAnalyzer:
     def generate_report(self, df: pd.DataFrame) -> Dict[str, Any]:
         """📝 生成問卷調查報告"""
         # 計算年齡
-        ages = self.calculate_age(df['２．出生年（民國__年）'])
         # 取得教育程度分布（帶計數單位）
-        education_counts = df['３．教育程度'].value_counts().to_dict()
         education_with_counts = {k: f"{v}人" for k, v in education_counts.items()}
         # 性別分布（帶計數單位）
-        gender_counts = df['1.   性別'].value_counts().to_dict()
         gender_with_counts = {k: f"{v}人" for k, v in gender_counts.items()}
         # 計算每個滿意度項目的平均分數和標準差
@@ -260,13 +209,38 @@ class SurveyAnalyzer:
         """🟠 性別分佈圓餅圖（使用藍色和紅色）"""
         # 過濾數據
         filtered_df = df.copy()
         if venues and '全部' not in venues:
-            filtered_df = filtered_df[filtered_df['場域名稱'].isin(venues)]
         if month and month != '全部':
-            # 假設有一個月份欄位，如果沒有請調整
-            filtered_df = filtered_df[filtered_df['月份'] == month]
-        gender_counts = filtered_df['1.   性別'].value_counts().reset_index()
         gender_counts.columns = ['性別', '人數']
         # 計算百分比
@@ -324,85 +298,35 @@ def main():
     # 上傳 CSV 檔案
     uploaded_file = st.file_uploader("上傳 CSV 檔案", type=['csv'])
     if uploaded_file is not None:
-        # 讀取上傳的 CSV 檔案
         try:
             df = pd.read_csv(uploaded_file, encoding='utf-8')
-            # 儲存到 session state，以便在其他函數中使用
-            st.session_state['uploaded_file'] = uploaded_file
-            # 創建分析器
-            analyzer = SurveyAnalyzer()
-    elif st.button('使用預設範例數據'):
-        # 如果沒有上傳檔案，提供預設數據讀取
-        df = read_google_sheet(sheet_id, gid)
-        if df is None:
-            st.error("無法讀取預設數據，請上傳 CSV 檔案")
-            return
-        analyzer = SurveyAnalyzer()
-    else:
-        st.info("請上傳 CSV 檔案或使用預設範例數據")
-        return
         # 新增場域和月份篩選器
         st.sidebar.header("🔍 數據篩選")
-        # 假設數據有「場域名稱」欄位，如果名稱不同請調整
-        if '場域名稱' in df.columns:
-            venues = ['全部'] + sorted(df['場域名稱'].unique().tolist())
-            selected_venues = st.sidebar.multiselect("選擇場域", venues, default=['全部'])
-        else:
-            # 如果沒有場域欄位，創建10個虛擬場域供選擇
-            venues = ['全部'] + [f'場域{i+1}' for i in range(10)]
-            selected_venues = st.sidebar.multiselect("選擇場域", venues, default=['全部'])
-        # 假設數據有「月份」欄位，如果沒有請調整
-        if '月份' in df.columns:
-            months = ['全部'] + sorted(df['月份'].unique().tolist())
-            selected_month = st.sidebar.selectbox("選擇月份", months)
-        else:
-            # 如果沒有月份欄位，可以創建虛擬月份選項
-            months = ['全部'] + [f'{i+1}月' for i in range(12)]
-            selected_month = st.sidebar.selectbox("選擇月份", months)
-        # 📌 基本統計數據
-        st.sidebar.header("📌 選擇數據分析")
-        selected_analysis = st.sidebar.radio("選擇要查看的分析",
-                                             ["📋 問卷統計報告", "📊 滿意度統計", "🟠 性別分佈"])
-        if selected_analysis == "📋 問卷統計報告":
-            st.header("📋 問卷統計報告")
-            report = analyzer.generate_report(df)
-            for category, stats in report.items():
-                with st.expander(f"🔍 {category}", expanded=True):
-                    for key, value in stats.items():
-                        if key == '各項滿意度':
-                            st.write(f"**{key}:**")
-                            for item, item_stats in value.items():
-                                st.write(f"  - **{item}**: {', '.join([f'{k}: {v}' for k, v in item_stats.items()])}")
-                        else:
-                            st.write(f"**{key}**: {value}")
-        elif selected_analysis == "📊 滿意度統計":
-            st.header("📊 滿意度統計")
-            analyzer.plot_satisfaction_scores(df)
-        elif selected_analysis == "🟠 性別分佈":
-            st.header("🟠 性別分佈")
-            analyzer.plot_gender_distribution(df, selected_venues, selected_month)
-        # 報告說明
-        st.markdown("---")
-        st.markdown("""
-        ### 報告說明
-        - **數據來源**：114年度樂齡學習數位示範體驗場域調查問卷
-        - **分析目的**：評估樂齡學習者對數位示範場域服務的滿意度
-        - **報告解讀**：本報告提供服務滿意度的客觀量化指標，旨在協助改進服務品質
-        """)
-if __name__ == "__main__":
-    main()

+import streamlit as st
 import pandas as pd
 import plotly.express as px
 import numpy as np
 class SurveyAnalyzer:
     """📊 問卷分析類"""
+    def __init__(self, df):
         self.mappings = SurveyMappings()
+        # Method to find the closest matching column
+        def find_matching_column(possible_columns):
+            for col in possible_columns:
+                # Try different variations of potential column names
+                variations = [
+                    col,
+                    col.replace('：', ''),
+                    col.replace('．', ''),
+                    col.strip()
+                ]
+                for var in variations:
+                    if var in df.columns:
+                        return var
+            return None
+        # Predefined column templates
+        column_templates = [
+            ('多元課程與活動', ['示範場域提供多元的數位課程與活動', '１： 示範場域提供多元的數位課程與活動']),
+            ('生活應用有幫助', ['示範場域的數位課程與活動對我的生活應用有幫助', '２．示範場域的數位課程與活動對我的生活應用有幫助']),
+            ('服務人員親切', ['示範場域的服務人員親切有禮貌', '３： 示範場域的服務人員親切有禮貌']),
+            ('空間設備友善', ['示範場域的服務空間與數位設備友善方便', '４．示範場域的服務空間與數位設備友善方便']),
+            ('獲得需要協助', ['在示範場域可以獲得需要的協助', '５．在示範場域可以獲得需要的協助']),
+            ('整體服務滿意', ['對於示範場域的服務感到滿意', '６．對於示範場域的服務感到滿意'])
         ]
+        # Find matching columns
+        self.satisfaction_short_names = []
+        self.satisfaction_columns = []
+        for short_name, column_options in column_templates:
+            matched_col = None
+            for col_option in column_options:
+                matched_col = find_matching_column([col_option])
+                if matched_col:
+                    self.satisfaction_columns.append(matched_col)
+                    self.satisfaction_short_names.append(short_name)
+                    break
+            if not matched_col:
+                st.warning(f"Could not find column for {short_name}")
     def calculate_age(self, birth_year_column):
         """🔢 計算年齡（從民國年到實際年齡）"""
         # 獲取當前年份（西元年）
     def generate_report(self, df: pd.DataFrame) -> Dict[str, Any]:
         """📝 生成問卷調查報告"""
         # 計算年齡
+        age_column = '２．出生年（民國__年）'
+        # 找到最接近的年齡欄位
+        possible_age_columns = [
+            '２．出生年（民國__年）',
+            '出生年',
+            '出生年（民國__年）'
+        ]
+        for col in possible_age_columns:
+            if col in df.columns:
+                age_column = col
+                break
+        ages = self.calculate_age(df[age_column])
         # 取得教育程度分布（帶計數單位）
+        education_column = '３．教育程度'
+        # 找到最接近的教育程度欄位
+        possible_education_columns = [
+            '３．教育程度',
+            '教育程度'
+        ]
+        for col in possible_education_columns:
+            if col in df.columns:
+                education_column = col
+                break
+        education_counts = df[education_column].value_counts().to_dict()
         education_with_counts = {k: f"{v}人" for k, v in education_counts.items()}
         # 性別分布（帶計數單位）
+        gender_column = '1.   性別'
+        # 找到最接近的性別欄位
+        possible_gender_columns = [
+            '1.   性別',
+            '性別'
+        ]
+        for col in possible_gender_columns:
+            if col in df.columns:
+                gender_column = col
+                break
+        gender_counts = df[gender_column].value_counts().to_dict()
         gender_with_counts = {k: f"{v}人" for k, v in gender_counts.items()}
         # 計算每個滿意度項目的平均分數和標準差
         """🟠 性別分佈圓餅圖（使用藍色和紅色）"""
         # 過濾數據
         filtered_df = df.copy()
+        # 場域篩選
+        venue_column = '場域名稱'
+        possible_venue_columns = ['場域名稱', 'venue']
+        for col in possible_venue_columns:
+            if col in filtered_df.columns:
+                venue_column = col
+                break
         if venues and '全部' not in venues:
+            filtered_df = filtered_df[filtered_df[venue_column].isin(venues)]
+        # 月份篩選
+        month_column = '月份'
+        possible_month_columns = ['月份', 'month']
+        for col in possible_month_columns:
+            if col in filtered_df.columns:
+                month_column = col
+                break
         if month and month != '全部':
+            filtered_df = filtered_df[filtered_df[month_column] == month]
+        # 性別欄位
+        gender_column = '1.   性別'
+        possible_gender_columns = ['1.   性別', '性別']
+        for col in possible_gender_columns:
+            if col in filtered_df.columns:
+                gender_column = col
+                break
+        gender_counts = filtered_df[gender_column].value_counts().reset_index()
         gender_counts.columns = ['性別', '人數']
         # 計算百分比
     # 上傳 CSV 檔案
     uploaded_file = st.file_uploader("上傳 CSV 檔案", type=['csv'])
+    # 初始化數據和分析器
+    df = None
+    analyzer = None
+    # 檢查是否有上傳檔案
     if uploaded_file is not None:
         try:
             df = pd.read_csv(uploaded_file, encoding='utf-8')
+            st.success("CSV 檔案上傳成功！")
+        except Exception as e:
+            st.error(f"無法讀取檔案：{e}")
+            return
+    # 如果沒有上傳檔案，提供使用預設數據的選項
+    if df is None:
+        if st.button('使用預設範例數據'):
+            df = read_google_sheet(sheet_id, gid)
+            if df is None:
+                st.error("無法讀取預設數據，請上傳 CSV 檔案")
+                return
+    # 如果有數據，則進行分析
+    if df is not None:
+        analyzer = SurveyAnalyzer(df)
         # 新增場域和月份篩選器
         st.sidebar.header("🔍 數據篩選")
+        # 場域篩選
+        venue_column = '場域名稱'
+        possible_venue_columns = ['場域名稱', 'venue']