Spaces:

blockenters
/

healthcare-app

Running

App Files Files Community

blockenters commited on Jan 28

Commit

0de191c

1 Parent(s): f3cadeb

add

Browse files

Files changed (4) hide show

app.py +99 -30
models/healthcare_model.pkl +0 -3
models/sample.txt +0 -0
requirements.txt +0 -5

app.py CHANGED Viewed

@@ -3,7 +3,15 @@
 import streamlit as st
 import pandas as pd
 import joblib
-import os
 # 모델 로드
 @st.cache_resource
@@ -11,38 +19,99 @@ def load_model():
     model = joblib.load('models/healthcare_model.pkl')
     return model
 def main():
-    st.title('의료 보험 청구액 예측 서비스')
-    # 사이드바에 입력 폼 생성
-    st.sidebar.header('환자 정보 입력')
-    age = st.sidebar.number_input('나이', min_value=0, max_value=100, value=30)
-    gender = st.sidebar.selectbox('성별', ['Male', 'Female'])
-    bmi = st.sidebar.number_input('BMI', min_value=10.0, max_value=50.0, value=25.0)
-    region = st.sidebar.selectbox('지역', ['North', 'South', 'East', 'West'])
-    smoker = st.sidebar.selectbox('흡연 여부', ['Yes', 'No'])
-    num_visits = st.sidebar.number_input('방문 횟수', min_value=0, max_value=20, value=5)
-    # 예측 버튼
-    if st.sidebar.button('예측하기'):
-        # 입력 데이터 구성
-        input_data = {
-            'Age': age,
-            'Gender': gender,
-            'BMI': bmi,
-            'Region': region,
-            'Smoker': smoker,
-            'NumVisits': num_visits
-        }
-        # 모델 로드 및 예측
-        model = load_model()
-        prediction = predict_insurance_claim(input_data, model)
-        # 결과 표시
-        st.header('예측 결과')
-        st.write(f'예상 보험 청구액: ${prediction:,.2f}')
 def predict_insurance_claim(data, pipeline):
     new_df = pd.DataFrame([data])

 import streamlit as st
 import pandas as pd
 import joblib
+import plotly.express as px
+import numpy as np
+# 데이터 로드
+@st.cache_data
+def load_data():
+    df = pd.read_csv('data/healthcare.csv', index_col=0)
+    return df
 # 모델 로드
 @st.cache_resource
     model = joblib.load('models/healthcare_model.pkl')
     return model
+def create_charts(df):
+    st.header('📊 데이터 분석')
+    # 1. 흡연 여부에 따른 보험 청구액 분포
+    st.subheader('흡연 여부에 따른 보험 청구액 분포')
+    fig = px.box(df, x='Smoker', y='InsuranceClaim', color='Smoker')
+    st.plotly_chart(fig)
+    # 2. 나이와 보험 청구액의 관계
+    st.subheader('나이와 보험 청구액의 관계')
+    fig = px.scatter(df, x='Age', y='InsuranceClaim', color='Gender',
+                    title='나이별 보험 청구액 분포',
+                    labels={'InsuranceClaim': '보험 청구액', 'Age': '나이'})
+    st.plotly_chart(fig)
+    # 3. BMI 구간별 평균 보험 청구액
+    st.subheader('BMI 구간별 평균 보험 청구액')
+    df['BMI_Category'] = pd.cut(df['BMI'],
+                               bins=[0, 18.5, 25, 30, 100],
+                               labels=['저체중', '정상', '과체중', '비만'])
+    bmi_avg = df.groupby('BMI_Category')['InsuranceClaim'].mean().reset_index()
+    fig = px.bar(bmi_avg, x='BMI_Category', y='InsuranceClaim',
+                 title='BMI 구간별 평균 보험 청구액',
+                 labels={'InsuranceClaim': '평균 보험 청구액', 'BMI_Category': 'BMI 구간'})
+    st.plotly_chart(fig)
+    # 4. 지역별 평균 보험 청구액
+    st.subheader('지역별 평균 보험 청구액')
+    region_avg = df.groupby('Region')['InsuranceClaim'].mean().reset_index()
+    fig = px.pie(region_avg, values='InsuranceClaim', names='Region',
+                 title='지역별 평균 보험 청구액 비율')
+    st.plotly_chart(fig)
+    # 5. 주요 통계 지표
+    st.subheader('💡 주요 통계 지표')
+    col1, col2, col3 = st.columns(3)
+    with col1:
+        st.metric("평균 보험 청구액", f"${df['InsuranceClaim'].mean():,.2f}")
+    with col2:
+        st.metric("최대 보험 청구액", f"${df['InsuranceClaim'].max():,.2f}")
+    with col3:
+        st.metric("최소 보험 청구액", f"${df['InsuranceClaim'].min():,.2f}")
 def main():
+    st.title('🏥 의료 보험 청구액 예측 서비스')
+    # 데이터 로드
+    df = load_data()
+    # 탭 생성
+    tab1, tab2 = st.tabs(["예측하기", "데이터 분석"])
+    with tab1:
+        # 사이드바에 입력 폼 생성
+        st.sidebar.header('환자 정보 입력')
+        age = st.sidebar.number_input('나이', min_value=0, max_value=100, value=30)
+        gender = st.sidebar.selectbox('성별', ['Male', 'Female'])
+        bmi = st.sidebar.number_input('BMI', min_value=10.0, max_value=50.0, value=25.0)
+        region = st.sidebar.selectbox('지역', ['North', 'South', 'East', 'West'])
+        smoker = st.sidebar.selectbox('흡연 여부', ['Yes', 'No'])
+        num_visits = st.sidebar.number_input('방문 횟수', min_value=0, max_value=20, value=5)
+        # 예측 버튼
+        if st.sidebar.button('예측하기'):
+            # 입력 데이터 구성
+            input_data = {
+                'Age': age,
+                'Gender': gender,
+                'BMI': bmi,
+                'Region': region,
+                'Smoker': smoker,
+                'NumVisits': num_visits
+            }
+            # 모델 로드 및 예측
+            model = load_model()
+            prediction = predict_insurance_claim(input_data, model)
+            # 결과 표시
+            st.header('예측 결과')
+            st.write(f'예상 보험 청구액: ${prediction:,.2f}')
+            # 예측 결과 설명
+            st.info("""
+            💡 예측 결과 설명:
+            - 이 예측은 환자의 기본 정보를 바탕으로 계산되었습니다.
+            - 실제 청구액은 구체적인 진료 내용에 따라 달라질 수 있습니다.
+            - 이 예측은 참고용으로만 사용해주세요.
+            """)
+    with tab2:
+        create_charts(df)
 def predict_insurance_claim(data, pipeline):
     new_df = pd.DataFrame([data])

models/healthcare_model.pkl DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a2cc7436c6162d93b08225a39337c511b12374b3618a3d21dd2332c30043a979
-size 4362

models/sample.txt DELETED Viewed

File without changes

requirements.txt DELETED Viewed

@@ -1,5 +0,0 @@
-streamlit
-scikit-learn
-pandas
-joblib
-numpy