Spaces:

Rooobert
/

114-Learning-Project-APP

Running

App Files Files Community

Rooobert committed 17 days ago

Commit

a33fe85

verified ·

1 Parent(s): 933be95

Update app.py

Browse files

Files changed (1) hide show

app.py +81 -152

app.py CHANGED Viewed

@@ -33,49 +33,24 @@ class SurveyMappings:
 class SurveyAnalyzer:
     """📊 問卷分析類"""
-    def __init__(self, df):
         self.mappings = SurveyMappings()
-        # Method to find the closest matching column
-        def find_matching_column(possible_columns):
-            for col in possible_columns:
-                # Try different variations of potential column names
-                variations = [
-                    col,
-                    col.replace('：', ''),
-                    col.replace('．', ''),
-                    col.strip()
-                ]
-                for var in variations:
-                    if var in df.columns:
-                        return var
-            return None
-        # Predefined column templates
-        column_templates = [
-            ('多元課程與活動', ['示範場域提供多元的數位課程與活動', '１： 示範場域提供多元的數位課程與活動']),
-            ('生活應用有幫助', ['示範場域的數位課程與活動對我的生活應用有幫助', '２．示範場域的數位課程與活動對我的生活應用有幫助']),
-            ('服務人員親切', ['示範場域的服務人員親切有禮貌', '３： 示範場域的服務人員親切有禮貌']),
-            ('空間設備友善', ['示範場域的服務空間與數位設備友善方便', '４．示範場域的服務空間與數位設備友善方便']),
-            ('獲得需要協助', ['在示範場域可以獲得需要的協助', '５．在示範場域可以獲得需要的協助']),
-            ('整體服務滿意', ['對於示範場域的服務感到滿意', '６．對於示範場域的服務感到滿意'])
         ]
-        # Find matching columns
-        self.satisfaction_short_names = []
-        self.satisfaction_columns = []
-        for short_name, column_options in column_templates:
-            matched_col = None
-            for col_option in column_options:
-                matched_col = find_matching_column([col_option])
-                if matched_col:
-                    self.satisfaction_columns.append(matched_col)
-                    self.satisfaction_short_names.append(short_name)
-                    break
-            if not matched_col:
-                st.warning(f"Could not find column for {short_name}")
     def calculate_age(self, birth_year_column):
         """🔢 計算年齡（從民國年到實際年齡）"""
@@ -96,48 +71,14 @@ class SurveyAnalyzer:
     def generate_report(self, df: pd.DataFrame) -> Dict[str, Any]:
         """📝 生成問卷調查報告"""
         # 計算年齡
-        age_column = '２．出生年（民國__年）'
-        # 找到最接近的年齡欄位
-        possible_age_columns = [
-            '２．出生年（民國__年）',
-            '出生年',
-            '出生年（民國__年）'
-        ]
-        for col in possible_age_columns:
-            if col in df.columns:
-                age_column = col
-                break
-        ages = self.calculate_age(df[age_column])
         # 取得教育程度分布（帶計數單位）
-        education_column = '３．教育程度'
-        # 找到最接近的教育程度欄位
-        possible_education_columns = [
-            '３．教育程度',
-            '教育程度'
-        ]
-        for col in possible_education_columns:
-            if col in df.columns:
-                education_column = col
-                break
-        education_counts = df[education_column].value_counts().to_dict()
         education_with_counts = {k: f"{v}人" for k, v in education_counts.items()}
         # 性別分布（帶計數單位）
-        gender_column = '1.   性別'
-        # 找到最接近的性別欄位
-        possible_gender_columns = [
-            '1.   性別',
-            '性別'
-        ]
-        for col in possible_gender_columns:
-            if col in df.columns:
-                gender_column = col
-                break
-        gender_counts = df[gender_column].value_counts().to_dict()
         gender_with_counts = {k: f"{v}人" for k, v in gender_counts.items()}
         # 計算每個滿意度項目的平均分數和標準差
@@ -209,38 +150,13 @@ class SurveyAnalyzer:
         """🟠 性別分佈圓餅圖（使用藍色和紅色）"""
         # 過濾數據
         filtered_df = df.copy()
-        # 場域篩選
-        venue_column = '場域名稱'
-        possible_venue_columns = ['場域名稱', 'venue']
-        for col in possible_venue_columns:
-            if col in filtered_df.columns:
-                venue_column = col
-                break
         if venues and '全部' not in venues:
-            filtered_df = filtered_df[filtered_df[venue_column].isin(venues)]
-        # 月份篩選
-        month_column = '月份'
-        possible_month_columns = ['月份', 'month']
-        for col in possible_month_columns:
-            if col in filtered_df.columns:
-                month_column = col
-                break
         if month and month != '全部':
-            filtered_df = filtered_df[filtered_df[month_column] == month]
-        # 性別欄位
-        gender_column = '1.   性別'
-        possible_gender_columns = ['1.   性別', '性別']
-        for col in possible_gender_columns:
-            if col in filtered_df.columns:
-                gender_column = col
-                break
-        gender_counts = filtered_df[gender_column].value_counts().reset_index()
         gender_counts.columns = ['性別', '人數']
         # 計算百分比
@@ -273,60 +189,73 @@ class SurveyAnalyzer:
 # 🎨 Streamlit UI
 def main():
-    # 設置頁面配置
     st.set_page_config(
-        page_title="114年度樂齡學習數位示範體驗場域 服務滿意度調查分析報告",
-        page_icon="📊",
         layout="wide"
     )
-    # 添加標題和子標題
     st.markdown("""
-    # 114年度樂齡學習數位示範體驗場域 服務滿意度調查分析報告
-    ## 全面理解樂齡學習者數位服務體驗
-    本報告提供全面的問卷調查分析與視覺化圖表，深入剖析樂齡學習者參與數位示範場域服務的滿意情形。
-    透過詳細的統計分析和互動式圖表，我們旨在呈現樂齡學習者的服務體驗和需求洞察。
-    ### 報告製作單位
-    **國立中正大學高齡教育研究中心專案管理團隊**
-    """)
-    # 分隔線
-    st.markdown("---")
-    # 上傳 CSV 檔案
-    uploaded_file = st.file_uploader("上傳 CSV 檔案", type=['csv'])
-    # 初始化數據和分析器
-    df = None
-    analyzer = None
-    # 檢查是否有上傳檔案
-    if uploaded_file is not None:
-        try:
-            df = pd.read_csv(uploaded_file, encoding='utf-8')
-            st.success("CSV 檔案上傳成功！")
-        except Exception as e:
-            st.error(f"無法讀取檔案：{e}")
-            return
-    # 如果沒有上傳檔案，提供使用預設數據的選項
-    if df is None:
-        if st.button('使用預設範例數據'):
-            df = read_google_sheet(sheet_id, gid)
-            if df is None:
-                st.error("無法讀取預設數據，請上傳 CSV 檔案")
-                return
-    # 如果有數據，則進行分析
-    if df is not None:
-        analyzer = SurveyAnalyzer(df)
-        # 新增場域和月份篩選器
-        st.sidebar.header("🔍 數據篩選")
-        # 場域篩選
-        venue_column = '場域名稱'
-        possible_venue_columns = ['場域名稱', 'venue']

 class SurveyAnalyzer:
     """📊 問卷分析類"""
+    def __init__(self):
         self.mappings = SurveyMappings()
+        self.satisfaction_columns = [
+            '１． 示範場域提供多元的數位課程與活動',
+            '２．示範場域的數位課程與活動對我的生活應用有幫助',
+            '３． 示範場域的服務人員親切有禮貌',
+            '４．示範場域的服務空間與數位設備友善方便',
+            '５．在示範場域可以獲得需要的協助',
+            '６．對於示範場域的服務感到滿意'
+        ]
+        self.satisfaction_short_names = [
+            '多元課程與活動',
+            '生活應用有幫助',
+            '服務人員親切',
+            '空間設備友善',
+            '獲得需要協助',
+            '整體服務滿意'
         ]
     def calculate_age(self, birth_year_column):
         """🔢 計算年齡（從民國年到實際年齡）"""
     def generate_report(self, df: pd.DataFrame) -> Dict[str, Any]:
         """📝 生成問卷調查報告"""
         # 計算年齡
+        ages = self.calculate_age(df['２．出生年（民國__年）'])
         # 取得教育程度分布（帶計數單位）
+        education_counts = df['３．教育程度'].value_counts().to_dict()
         education_with_counts = {k: f"{v}人" for k, v in education_counts.items()}
         # 性別分布（帶計數單位）
+        gender_counts = df['1.   性別'].value_counts().to_dict()
         gender_with_counts = {k: f"{v}人" for k, v in gender_counts.items()}
         # 計算每個滿意度項目的平均分數和標準差
         """🟠 性別分佈圓餅圖（使用藍色和紅色）"""
         # 過濾數據
         filtered_df = df.copy()
         if venues and '全部' not in venues:
+            filtered_df = filtered_df[filtered_df['場域名稱'].isin(venues)]
         if month and month != '全部':
+            # 假設有一個月份欄位，如果沒有請調整
+            filtered_df = filtered_df[filtered_df['月份'] == month]
+        gender_counts = filtered_df['1.   性別'].value_counts().reset_index()
         gender_counts.columns = ['性別', '人數']
         # 計算百分比
 # 🎨 Streamlit UI
 def main():
     st.set_page_config(
+        page_title="樂齡學習數位示範體驗場域 服務滿意度調查",
+        page_icon="📊",
         layout="wide"
     )
     st.markdown("""
+    # 📊 114年度樂齡學習數位示範體驗場域
+    ## 服務滿意度調查分析報告
+    *國立中正大學高齡教育研究中心專案管理團隊 精心製作*
+    本報告提供全面的問卷調查分析與視覺化圖表，深入剖析樂齡學習者參與數位示範場域服務的滿意情形。透過精細的數據分析，我們旨在瞭解高齡學習者的服務體驗，並為未來數位學習環境的優化提供寶貴洞見。
+    """, unsafe_allow_html=True)
+    # 讀取數據
+    df = read_google_sheet(sheet_id, gid)
+    if df is not None:
+        analyzer = SurveyAnalyzer()
+        # 新增場域和月份篩選器
+        st.sidebar.header("🔍 數據篩選")
+        # 假設數據有「場域名稱」欄位，如果名稱不同請調整
+        if '場域名稱' in df.columns:
+            venues = ['全部'] + sorted(df['場域名稱'].unique().tolist())
+            selected_venues = st.sidebar.multiselect("選擇場域", venues, default=['全部'])
+        else:
+            # 如果沒有場域欄位，創建10個虛擬場域供選擇
+            venues = ['全部'] + [f'場域{i+1}' for i in range(10)]
+            selected_venues = st.sidebar.multiselect("選擇場域", venues, default=['全部'])
+        # 假設數據有「月份」欄位，如果沒有請調整
+        if '月份' in df.columns:
+            months = ['全部'] + sorted(df['月份'].unique().tolist())
+            selected_month = st.sidebar.selectbox("選擇月份", months)
+        else:
+            # 如果沒有月份欄位，可以創建虛擬月份選項
+            months = ['全部'] + [f'{i+1}月' for i in range(12)]
+            selected_month = st.sidebar.selectbox("選擇月份", months)
+        # 📌 基本統計數據
+        st.sidebar.header("📌 選擇數據分析")
+        selected_analysis = st.sidebar.radio("選擇要查看的分析",
+                                             ["📋 問卷統計報告", "📊 滿意度統計", "🟠 性別分佈"])
+        if selected_analysis == "📋 問卷統計報告":
+            st.header("📋 問卷統計報告")
+            report = analyzer.generate_report(df)
+            for category, stats in report.items():
+                with st.expander(f"🔍 {category}", expanded=True):
+                    for key, value in stats.items():
+                        if key == '各項滿意度':
+                            st.write(f"**{key}:**")
+                            for item, item_stats in value.items():
+                                st.write(f"  - **{item}**: {', '.join([f'{k}: {v}' for k, v in item_stats.items()])}")
+                        else:
+                            st.write(f"**{key}**: {value}")
+        elif selected_analysis == "📊 滿意度統計":
+            st.header("📊 滿意度統計")
+            analyzer.plot_satisfaction_scores(df)
+        elif selected_analysis == "🟠 性別分佈":
+            st.header("🟠 性別分佈")
+            analyzer.plot_gender_distribution(df, selected_venues, selected_month)
+if __name__ == "__main__":
+    main()