Spaces:

pcreem
/

brown-cafe

Sleeping

App Files Files Community

Song commited on 21 days ago

Commit

9e85da1

1 Parent(s): b20c534

hi

Browse files

Files changed (1) hide show

app.py +279 -610

app.py CHANGED Viewed

@@ -27,6 +27,7 @@ for d in (os.getenv("HF_HOME"), os.getenv("SENTENCE_TRANSFORMERS_HOME"), os.gete
 # ---------- Imports ----------
 import re, hmac, base64, hashlib, pickle, logging, time, json
 from typing import List, Dict, Any, Optional, Tuple, Union
 import numpy as np
 import pandas as pd
@@ -38,659 +39,323 @@ except Exception:
     torch = None
 try:
-    import faiss  # type: ignore
-except Exception as e:
-    raise RuntimeError(f"faiss not available: {e}")
 try:
-    from sentence_transformers import SentenceTransformer, CrossEncoder  # type: ignore
 except Exception:
     SentenceTransformer = None
 try:
-    from rank_bm25 import BM25Okapi  # type: ignore
 except Exception:
     BM25Okapi = None
-try:
-    import jieba  # type: ignore
-except Exception:
-    jieba = None
-try:
-    from fuzzywuzzy import fuzz  # type: ignore
-except Exception:
-    fuzz = None
-try:
-    import requests  # type: ignore
-except Exception:
-    requests = None
-from fastapi import FastAPI, HTTPException, Header, Request
-# ---------- Logging ----------
-LOG_LEVEL = (os.getenv("LOG_LEVEL") or "INFO").upper()
-logging.basicConfig(level=LOG_LEVEL, format="%(asctime)s - %(levelname)s - %(message)s")
-log = logging.getLogger("app")
-# ---------- 只讀取你指定的 HF 環境變數 ----------
-CHANNEL_ACCESS_TOKEN = os.getenv("CHANNEL_ACCESS_TOKEN")
-CHANNEL_SECRET       = os.getenv("CHANNEL_SECRET")
-LITELLM_API_KEY      = os.getenv("LITELLM_API_KEY")
-LITELLM_BASE_URL     = os.getenv("LITELLM_BASE_URL")
-LM_MODEL             = os.getenv("LM_MODEL")
-# ---------- 檢索設定（固定常數） ----------
-TOP_K_SENTENCES   = 10
-BM25_WEIGHT       = 0.8
-SEM_WEIGHT        = 0.2
-EMBEDDING_MODEL_ID= "DMetaSoul/Dmeta-embedding-zh"
-RERANKER_MODEL_ID = "BAAI/bge-reranker-base"
-USE_CPU           = True  # HF 預設 CPU
-RERANK_THRESHOLD  = 0.5
-MAX_CONTEXT_CHARS = 8000
-DISCLAIMER = "此回覆僅供參考，請遵循醫師/藥師指示。"
-# 藥名映射與停用詞
-DRUG_NAME_MAPPING = {
-    "fentanyl patch": "fentanyl",
-    "spiriva respimat": "spiriva",
-    "augmentin for syrup": "augmentin syrup",
-    "nitrostat": "nitroglycerin",
-    "ozempic": "ozempic",
-    "niflec": "niflec",
-    "fosamax": "alendronate",
-    "humira": "adalimumab",
-    "premarin": "premarin",
-    "smecta": "smecta",
-    "duragesic": "fentanyl",
-    "芬太尼貼片": "fentanyl",
-    "透皮止痛貼片": "fentanyl",
-}
-DRUG_STOPWORDS = {"藥", "劑", "錠", "膠囊", "糖漿", "乳膏", "貼片", "含錠", "膜衣錠", "緩釋錠", "滴劑", "懸液", "注射液",
-                  "吸入劑", "噴霧", "噴霧劑", "吸入器", "注射筆", "藥水", "小袋", "條", "包", "瓶", "外用", "口服"}
-# 意圖分類（改用字典提升匹配率）
-INTENT_KEYWORDS = {
-    "如何用藥 (Administration)": ["操作", "使用", "怎麼用", "怎麼吃", "怎麼貼", "怎麼喝", "怎麼注射", "服用", "組裝", "安裝", "用藥方式"],
-    "保存/攜帶 (Storage & Handling)": ["保存", "儲存", "攜帶", "冷藏", "室溫", "潮濕", "保冰袋", "旅遊"],
-    "副作用/異常 (Side Effects / Issues)": ["副作用", "異常", "不良反應", "頭暈", "拉肚子", "噁心", "想吐", "過敏", "問題"],
-    "劑量調整 (Dosage Adjustment)": ["劑量", "幾顆", "調整", "忘記吃", "上限", "幾次", "劑量多少"],
-    "用藥時間 (Timing)": ["時間", "多久", "間隔", "飯前", "飯後", "隨餐", "睡前", "什麼時候"],
-    "禁忌症/適應症 (Contraindications/Indications)": ["禁忌", "適應症", "不能用", "不適合", "誰不能吃", "適合"],
-}
-# 章節權重
 SECTION_NORMALIZE = {
-  "用法用量": "用法及用量",
-  "副作用不良反應": "不良反應",
-  "警語注意事項": "警語及注意事項",
-  "交互作用": "藥物交互作用",
-  "包裝及儲存": "儲存條件",
-  "儲存條件": "儲存條件"
-}
-SECTION_WEIGHTS = {
-    "用法及用量": 1.0,
-    "病人使用須知": 1.0,
-    "儲存條件": 1.0,
-    "警語及注意事項": 1.0,
-    "禁忌": 1.0,
-    "副作用": 1.0,
-    "藥物交互作用": 1.0,
-    "其他": 1.0,
-    "包裝及儲存": 1.0,
-    "不良反應": 1.0,
 }
-IMPORTANT_SECTIONS = ["用法及用量", "病人使用須知", "包裝及儲存", "不良反應", "警語及注意事項"]
-# 移除 DOSAGE_FORM_BOOST
-# ---------- 路徑工具 ----------
-def pick_existing_or_tmp(candidates: List[str]) -> str:
-    for p in candidates:
-        if os.path.exists(p):
-            return p
-    base = os.path.basename(candidates[0])
-    fallback = os.path.join("/tmp", base)
-    pathlib.Path(fallback).parent.mkdir(parents=True, exist_ok=True)
-    return fallback
-def safe_pickle_dump(obj: Any, preferred_path: str) -> str:
-    try:
-        pathlib.Path(preferred_path).parent.mkdir(parents=True, exist_ok=True)
-        with open(preferred_path, "wb") as f:
-            pickle.dump(obj, f)
-        return preferred_path
-    except OSError as e:
-        if e.errno == errno.EACCES:
-            alt = os.path.join("/tmp", os.path.basename(preferred_path))
-            try:
-                with open(alt, "wb") as f:
-                    pickle.dump(obj, f)
-                log.warning("No write permission for %s, saved to %s instead.", preferred_path, alt)
-                return alt
-            except Exception as ee:
-                log.warning("Failed to save to /tmp as well: %s", ee)
-        else:
-            log.warning("pickle dump failed: %s", e)
-    except Exception as e:
-        log.warning("pickle dump failed: %s", e)
-    return ""
-def safe_faiss_write(index, preferred_path: str) -> str:
-    try:
-        pathlib.Path(preferred_path).parent.mkdir(parents=True, exist_ok=True)
-        faiss.write_index(index, preferred_path)
-        return preferred_path
-    except OSError as e:
-        if e.errno == errno.EACCES:
-            alt = os.path.join("/tmp", os.path.basename(preferred_path))
-            try:
-                faiss.write_index(index, alt)
-                log.warning("No write permission for %s, saved FAISS to %s instead.", preferred_path, alt)
-                return alt
-            except Exception as ee:
-                log.warning("Failed to save FAISS to /tmp as well: %s", ee)
-        else:
-            log.warning("faiss write failed: %s", e)
-    except Exception as e:
-        log.warning("faiss write failed: %s", e)
-    return ""
-# ---------- 檔案路徑（優先專案根目錄，其次 /app，最後 /tmp） ----------
-CWD = os.getcwd()
-SENTENCES_PKL = pick_existing_or_tmp([
-    os.path.join(CWD, "drug_sentences.pkl"),
-    "/app/drug_sentences.pkl",
-    "/tmp/drug_sentences.pkl",
-])
-FAISS_INDEX = pick_existing_or_tmp([
-    os.path.join(CWD, "drug_sentences.index"),
-    "/app/drug_sentences.index",
-    "/tmp/drug_sentences.index",
-])
-BM25_PKL = pick_existing_or_tmp([
-    os.path.join(CWD, "bm25.pkl"),
-    "/app/bm25.pkl",
-    "/tmp/bm25.pkl",
-])
-CSV_PATH = pick_existing_or_tmp([
-    os.path.join(CWD, "cleaned_combined.csv"),
-    "/app/cleaned_combined.csv",
-    "/tmp/cleaned_combined.csv",
-])
-# ---------- FastAPI ----------
-app = FastAPI(title="DrugQA (ZH) — LINE Webhook Only")
-# ---------- Helpers ----------
-_ZH_SPLIT_RE = re.compile(r"[。！？\n]")
-def split_sentences(text: str) -> List[str]:
-    if not isinstance(text, str): return []
-    sents = [s.strip() for s in _ZH_SPLIT_RE.split(text) if s.strip()]
-    return [s for s in sents if len(s) > 6]
-def tokenize_zh(s: str) -> List[str]:
-    if not isinstance(s, str) or not s: return []
-    if jieba is None: return s.strip().split()
-    return [t for t in jieba.lcut(s) if t.strip() and t not in DRUG_STOPWORDS]
-def detect_intent(query: str) -> List[str]:
-    """Detects user intent based on keywords."""
-    detected = []
-    query_lower = query.lower().replace(" ", "")
-    for intent, keywords in INTENT_KEYWORDS.items():
-        if any(k in query_lower for k in keywords):
-            detected.append(intent)
-    return detected
-class State:
-    sentences: List[str] = []
-    meta: List[Dict[str, Any]] = []
-    emb_model: Optional[Any] = None
-    reranker_model: Optional[Any] = None
-    faiss_index: Optional[Any] = None
-    bm25: Optional[Any] = None
-    df_csv: Optional[pd.DataFrame] = None
-    user_sessions: Dict[str, Dict[str, Any]] = {}
-    query_cache: Dict[str, Dict[str, Any]] = {}
-STATE = State()
-# ---------- 載入與建立 ----------
-def ensure_sentences_meta() -> Tuple[List[str], List[Dict[str, Any]]]:
     if os.path.exists(SENTENCES_PKL):
-        try:
-            with open(SENTENCES_PKL, "rb") as f:
-                obj = pickle.load(f)
-            sents = obj.get("sentences", []) if isinstance(obj, dict) else []
-            meta  = obj.get("meta", []) if isinstance(obj, dict) else []
-            log.info("Loaded sentences/meta: %s (n=%d)", SENTENCES_PKL, len(sents))
-            return sents, meta
-        except Exception as e:
-            log.warning("Failed to load sentences pkl (%s). Corpus will be empty.", e)
-    else:
-        log.info("Sentences pkl not found: %s", SENTENCES_PKL)
-    return [], []
 def load_embedding_model(model_id: str):
     if SentenceTransformer is None:
-        log.warning("sentence-transformers 不可用；僅以 BM25 檢索。")
         return None
-    device = "cpu" if (USE_CPU or (torch is None)) else ("cuda" if torch.cuda.is_available() else "cpu")
-    log.info("Load SentenceTransformer: %s on %s", model_id, device)
     try:
-        return SentenceTransformer(model_id, device=device)
     except Exception as e:
-        log.warning("Failed to load embedding model: %s", e)
         return None
 def load_reranker_model(model_id: str):
-    if CrossEncoder is None:
-        log.warning("CrossEncoder 不可用；略過 rerank。")
         return None
-    device = "cpu" if (USE_CPU or (torch is None)) else ("cuda" if torch.cuda.is_available() else "cpu")
-    log.info("Load CrossEncoder: %s on %s", model_id, device)
     try:
-        return CrossEncoder(model_id, device=device)
     except Exception as e:
-        log.warning("Failed to load reranker model: %s", e)
         return None
-def ensure_faiss(index_path: str, sentences: List[str]) -> Optional[Any]:
-    if not faiss: return None
-    if os.path.exists(index_path):
-        try:
-            idx = faiss.read_index(index_path)
-            if idx.ntotal == len(sentences):
-                log.info("Loaded FAISS: %s (d=%d n=%d)", index_path, idx.d, idx.ntotal)
-                return idx
-            else:
-                log.warning("FAISS ntotal mismatch (%d != %d). Rebuilding.", idx.ntotal, len(sentences))
-        except Exception as e:
-            log.warning("Failed to load FAISS (%s): %s", index_path, e)
-    if STATE.emb_model is None:
-        log.warning("No emb_model; skip FAISS build.")
         return None
-    log.info("Building FAISS (n=%d)...", len(sentences))
-    embeds = STATE.emb_model.encode(sentences, normalize_embeddings=True, show_progress_bar=True)
-    dim = embeds.shape[1]
-    idx = faiss.IndexFlatIP(dim)
-    idx.add(embeds.astype(np.float32))
-    safe_faiss_write(idx, index_path)
-    return idx
-def ensure_bm25(pkl_path: str, sentences: List[str]) -> Optional[Any]:
-    if BM25Okapi is None: return None
-    if os.path.exists(pkl_path):
-        try:
-            with open(pkl_path, "rb") as f:
-                bm = pickle.load(f)
-            # BM25 has corpus, not corpus_size attribute
-            n_bm = len(bm.corpus) if hasattr(bm, 'corpus') else 0
-            if n_bm == len(sentences):
-                log.info("Loaded BM25: %s (n=%d)", pkl_path, n_bm)
-                return bm
-            else:
-                log.warning("BM25 corpus size mismatch (%d != %d). Rebuilding.", n_bm, len(sentences))
-        except Exception as e:
-            log.warning("Failed to load BM25 (%s): %s", pkl_path, e)
-    log.info("Building BM25 (n=%d)...", len(sentences))
-    tokenized_corpus = [tokenize_zh(s) for s in sentences]
-    bm = BM25Okapi(tokenized_corpus)
-    safe_pickle_dump(bm, pkl_path)
-    return bm
-# ---------- 資訊解析與藥名處理 (簡化) ----------
-# 1. parse_user_message: 簡化為只比對藥名
-def parse_user_message(query: str, df: pd.DataFrame) -> Dict[str, Any]:
-    """
-    MODIFIED: 只比對 drug_name_norm，找最佳藥品。
-    """
-    best_drug = None
-    best_row = None
-    max_score = 0
-    if not fuzz:
-        log.warning("fuzzywuzzy not available; skipping fuzzy match.")
-        return {
-            "drug_name": None,
-            "drug_id": None,
-            "question": query,
-        }
-    # Use a pre-tokenized and normalized list for faster fuzzy matching
-    # In a real app, this should be pre-computed and stored for efficiency
-    unique_drugs = df.drop_duplicates(subset=['drug_id'])
-    # Check for direct match first
-    query_lower = query.lower().strip()
-    direct_match = unique_drugs[unique_drugs['drug_name_norm'].str.lower() == query_lower]
-    if not direct_match.empty:
-        best_row = direct_match.iloc[0]
-        best_drug = best_row["drug_name_norm"]
-        log.info(f"Direct match found: {best_drug}")
-    else:
-        for _, row in unique_drugs.iterrows():
-            drug_norm = (row.get('drug_name_norm') or "").lower()
-            score = fuzz.token_set_ratio(query_lower, drug_norm)
-            if score > max_score:
-                max_score = score
-                best_drug = drug_norm
-                best_row = row
-    if best_drug is None or max_score < 80: # 設定一個閾值來避免不相關的匹配
-        log.warning(f"No confident drug match found (score: {max_score})")
-        return {
-            "drug_name": None,
-            "drug_id": None,
-            "question": query,
-        }
-    log.info(f"Parsed user message (best match): {best_drug}, score: {max_score}")
-    return {
-      "drug_name": best_drug,
-      "drug_id": best_row["drug_id"],
-      "question": query
-    }
-# 2. find_drug_candidates: 簡化為單純 fuzzy 比對
-def find_drug_candidates(parsed_info: Dict[str, Any], df: pd.DataFrame, top_k: int = 5) -> List[Dict[str, Any]]:
-    """
-    MODIFIED: 單純對 drug_name_norm 做 fuzzy 比對，並回傳前 top_k 候選。
-    """
-    query_text = parsed_info.get("question", "").lower()
-    if df is None or df.empty or not query_text:
-        return []
-    if not fuzz:
         return []
-    candidates_list = []
-    unique_drugs = df.drop_duplicates(subset=['drug_id'])
-    for _, row in unique_drugs.iterrows():
-        drug_norm = (row.get('drug_name_norm') or "").lower()
-        score = fuzz.token_set_ratio(query_text, drug_norm)
-        candidates_list.append({
-            "drug_id": row["drug_id"],
-            "drug_name": drug_norm,
-            "score": score
-        })
-    # 依 score 排序並回傳前 top_k
-    sorted_candidates = sorted(candidates_list, key=lambda x: x['score'], reverse=True)
-    log.info(f"Found drug candidates: {sorted_candidates[:top_k]}")
-    return sorted_candidates[:top_k]
-# 3. answer_pipeline: 簡化流程
-async def answer_pipeline(query: str, user_id: str) -> str:
-    log.info("Pipeline start for user_id: %s, query: %s", user_id, query[:50])
-    if not query or not isinstance(query, str):
-        return handle_error("INVALID_QUERY")
-    if not STATE.sentences or not STATE.df_csv:
-        return handle_error("NO_CORPUS")
-    # 1. 解析使用者輸入並找到最佳藥品
-    best_drug_info = parse_user_message(query, STATE.df_csv)
-    if not best_drug_info.get("drug_id"):
-        log.warning("No confident drug match found.")
-        return make_clarify_message()
-    # 2. 呼叫 find_drug_candidates 產生候選清單
-    drug_candidates = find_drug_candidates(best_drug_info, STATE.df_csv)
-    # 3. 依 score >= 95 或與次高分差距 > 10 判斷是否選定最佳藥品
-    top_score = drug_candidates[0]['score'] if drug_candidates else 0
-    second_score = drug_candidates[1]['score'] if len(drug_candidates) > 1 else 0
-    if top_score >= 95 or (top_score - second_score) > 10:
-        log.info("Confidently selected drug: %s", best_drug_info['drug_name'])
-        drug_choice = best_drug_info
-    else:
-        log.info("Scores are too close, requesting clarification.")
-        options = [f"「{c.get('drug_name')}」" for c in drug_candidates[:3]]
-        return f"請問您指的是以下哪一種藥物？\n- " + "\n- ".join(options) + f"\n\n{DISCLAIMER}"
-    # 4. 檢索相關內文 (fuse_and_select)
-    idxs = fuse_and_select(
-        query=best_drug_info["question"],
-        sentences=STATE.sentences,
-        meta=STATE.meta,
-        bm25=STATE.bm25,
-        index=STATE.faiss_index,
-        emb_model=STATE.emb_model,
-        reranker=STATE.reranker_model,
-        top_k=TOP_K_SENTENCES,
-        drug_id=drug_choice['drug_id'],
-        # 移除 parsed_info
-    )
-    if not idxs:
-        return handle_error("NO_CONTEXT")
-    # 5. 建立上下文和 Prompt (build_prompt)
-    context = build_context(idxs, STATE.sentences, STATE.meta)
-    prompt = build_prompt(best_drug_info, context, drug_choice)
-    log.info("Generated Prompt:\n%s", prompt)
-    # 6. 呼叫 LLM 生成答案
-    answer = call_llm(prompt)
-    if not answer:
-        return handle_error("LLM_ERROR")
-    return f"{answer}\n\n{DISCLAIMER}"
-# 4. build_prompt: 簡化提示詞
-def build_prompt(parsed_info: Dict[str, Any], contexts: str, drug_choice: Dict[str, Any]) -> str:
-    """
-    MODIFIED: 簡化為只包含藥品名稱、使用者問題、參考片段。
-    """
-    return (
-        "你是一位專業、有同理心的藥師。請根據提供的「參考片段」，簡潔地回答使用者的「問題」。\n"
-        "---限制---\n"
-        "- 絕對忠於「參考片段」，不可捏造或過度推論。你的知識僅限於提供的片段。\n"
-        "- 回覆少於 120 字，並使用繁體中文條列式 2-4 點說明。\n"
-        "- 語氣親切、精簡、專業。\n"
-        "- 若片段中無足夠資訊回答，必須回覆：「根據提供的資料，我無法找到關於您問題的明確答案，建議您諮詢醫師或藥師。」\n"
-        "---輸入資訊---\n"
-        f"藥物名稱: {drug_choice.get('drug_name')}\n"
-        f"問題: {parsed_info.get('question')}\n\n"
-        f"參考片段:\n{contexts}\n"
-        "---你的回答---"
     )
-def call_llm(prompt: str, max_tokens: int = 2048) -> Optional[str]:
-    try:
-        from openai import OpenAI
-    except Exception as e:
-        log.warning("openai client 不可用：%s", e)
-        return None
-    if not (LITELLM_API_KEY and LM_MODEL and LITELLM_BASE_URL):
-        log.warning("LLM 未完整設定；略過生成。")
-        return None
-    client = OpenAI(base_url=LITELLM_BASE_URL, api_key=LITELLM_API_KEY)
     try:
-        t0 = time.time()
-        resp = client.chat.completions.create(
             model=LM_MODEL,
-            messages=[{"role": "user", "content": prompt}],
-            temperature=0.1,
-            timeout=15,
-            max_tokens=max_tokens,
         )
-        used = time.time() - t0
-        log.info("LLM ok (%.2fs)", used)
-        return (resp.choices[0].message.content or "").strip()
     except Exception as e:
-        log.warning("LLM 失敗：%s", e)
-        return None
-def make_clarify_message() -> str:
-    msg = (
-        "我需要更多資訊才能準確回答，請您提供：\n"
-        "1. 完整的藥物名稱\n"
-        "2. 您的具體問題\n\n"
-        f"{DISCLAIMER}"
-    )
-    return msg
-def handle_error(code: str) -> str:
-    log.error(f"Pipeline error: {code}")
-    return f"抱歉，系統暫時無法回覆 ({code})。請諮詢醫師或藥師。{DISCLAIMER}"
-# 5. fuse_and_select: 移除劑型加權
-def fuse_and_select(query: str, sentences: List[str], meta: List[Dict[str, Any]], bm25: Optional[Any], index: Optional[Any], emb_model: Optional[Any], reranker: Optional[Any], top_k: int = 10, drug_id: str = None) -> List[int]:
-    """
-    MODIFIED: 移除劑型加權。只保留 BM25/FAISS 融合 + 章節加權 + 意圖加權。
-    """
-    clean_query = query.strip().lower()
-    cache_key = clean_query + str(drug_id)
-    if cache_key in STATE.query_cache and time.time() - STATE.query_cache[cache_key]['time'] < 180:
-        log.info("Cache hit for query: %s", clean_query[:50])
-        return STATE.query_cache[cache_key]['idxs']
-    log.info("Searching for drug_id: %s with query: %s", drug_id, clean_query[:50])
-    if not drug_id:
-        log.warning("No drug_id provided; falling back to full corpus search.")
-    tokenized_query = tokenize_zh(clean_query)
-    scores = {}
-    # BM25 lexical search
-    if bm25:
-        bm_scores = bm25.get_scores(tokenized_query)
-        bm_scores_np = np.array(bm_scores)
-        if np.max(bm_scores_np) > np.min(bm_scores_np):
-            scores_norm = (bm_scores_np - np.min(bm_scores_np)) / (np.max(bm_scores_np) - np.min(bm_scores_np))
-        else:
-            scores_norm = bm_scores_np
-        for i, s_norm in enumerate(scores_norm):
-            if 0 <= i < len(meta) and (not drug_id or meta[i].get("drug_id") == drug_id):
-                scores[i] = scores.get(i, 0.0) + BM25_WEIGHT * s_norm
-    # FAISS semantic search
-    if emb_model and index:
-        q_emb = emb_model.encode([clean_query], normalize_embeddings=True).astype(np.float32)
-        _, idxs = index.search(q_emb, top_k * 8)
-        for rank, i in enumerate(idxs[0].tolist()):
-            if 0 <= i < len(meta) and (not drug_id or meta[i].get("drug_id") == drug_id):
-                scores[i] = scores.get(i, 0.0) + SEM_WEIGHT * (1.0 / (1 + rank))
-    # Apply boosts
-    for i in list(scores.keys()): # Iterate over a copy of keys
-        meta_item = meta[i]
-        # Section weight boost
-        sec = meta_item.get("section", "其他")
-        scores[i] *= SECTION_WEIGHTS.get(sec, 1.0)
-    # Boost based on detected intent
-    detected_intents = detect_intent(clean_query)
-    for i in list(scores.keys()):
-        meta_item = meta[i]
-        sec = meta_item.get("section", "其他")
-        if any(intent in detected_intents for intent in ["如何用藥 (Administration)", "用藥時間 (Timing)", "劑量調整 (Dosage Adjustment)"]) and sec in ["用法及用量", "病人使用須知"]:
-            scores[i] *= 1.5
-        elif any(intent in detected_intents for intent in ["保存/攜帶 (Storage & Handling)"]) and sec in ["儲存條件", "包裝及儲存"]:
-            scores[i] *= 1.5
-        elif any(intent in detected_intents for intent in ["副作用/異常 (Side Effects / Issues)"]) and sec in ["不良反應", "警語及注意事項"]:
-            scores[i] *= 1.5
-    # Inject important sections if they are missing
-    for sec in IMPORTANT_SECTIONS:
-        sec_idx = next((i for i, m in enumerate(meta) if (m.get("drug_id") == drug_id) and m.get("section") == sec), None)
-        if sec_idx is not None and sec_idx not in scores:
-            scores[sec_idx] = 1.0 # Give it a moderate score to ensure inclusion before reranking
-    # Prepare for reranking
-    candidates = [(i, sc, 0.0, 0.0) for i, sc in scores.items()]
-    reranked = rerank_results(clean_query, candidates, sentences, reranker, top_k, RERANK_THRESHOLD)
-    idxs = [r["idx"] for r in reranked]
-    STATE.query_cache[cache_key] = {'idxs': idxs, 'time': time.time()}
-    return idxs
-def build_context(idxs: List[int], sentences: List[str], meta: List[Dict[str, Any]]) -> str:
-    ctx_lines, total_len, seen = [], 0, set()
-    for i in idxs:
-        if i < 0: continue
-        text = sentences[i]
-        if text in seen: continue
-        chunk_id = meta[i].get("chunk_id", "None")
-        section = meta[i].get("section", "未知章節")
-        line = f"[{section}]: {text}"
-        if total_len + len(line) > MAX_CONTEXT_CHARS: break
-        ctx_lines.append(line)
-        total_len += len(line) + 1
-        seen.add(text)
-    return "\n".join(ctx_lines) or "[未知章節]: 沒有找到相關資料，請諮詢醫師或藥師。"
-# ---------- LINE 驗簽與回覆 ----------
-def verify_line_signature(body_bytes: bytes, signature: str) -> bool:
-    if not CHANNEL_SECRET:
-        log.warning("CHANNEL_SECRET 未設定；跳過簽章驗證（僅供測試）。")
-        return True
-    try:
-        mac = hmac.new(CHANNEL_SECRET.encode("utf-8"), body_bytes, hashlib.sha256).digest()
-        expected = base64.b64encode(mac).decode("utf-8")
-        return hmac.compare_digest(expected, signature)
-    except Exception as e:
-        log.warning("簽章驗證錯誤：%s", e)
-        return False
-def line_reply(reply_token: str, text: str) -> None:
-    if not CHANNEL_ACCESS_TOKEN or requests is None:
-        log.warning("缺少 CHANNEL_ACCESS_TOKEN 或 requests；略過回覆。")
-        return
-    url = "https://api.line.me/v2/bot/message/reply"
     headers = {
-        "Content-Type": "application/json",
-        "Authorization": f"Bearer {CHANNEL_ACCESS_TOKEN}",
     }
-    data = {"replyToken": reply_token, "messages": [{"type": "text", "text": text[:4900]}]}
     try:
-        r = requests.post(url, headers=headers, json=data, timeout=10)
-        if r.status_code != 200:
-            log.warning("LINE 回覆失敗：%s %s", r.status_code, r.text[:200])
     except Exception as e:
-        log.warning("LINE 回覆例外：%s", e)
-# ---------- 只有這一條路由：POST /webhook ----------
 @app.post("/webhook")
-async def webhook(request: Request, x_line_signature: str = Header(default="")):
-    body = await request.body()
-    if not verify_line_signature(body, x_line_signature):
-        raise HTTPException(status_code=401, detail="Invalid LINE signature")
-    try:
-        payload = await request.json()
-    except Exception:
-        raise HTTPException(status_code=400, detail="Invalid JSON body")
-    events = payload.get("events", [])
-    for ev in events:
-        if ev.get("type") == "message" and ev.get("message", {}).get("type") == "text":
-            reply_token = ev.get("replyToken")
-            user_id = ev.get("source", {}).get("userId", "unknown")
-            user_text = (ev.get("message", {}).get("text") or "").strip()
             try:
-                answer = await answer_pipeline(user_text, user_id)
             except Exception as e:
                 log.warning("Pipeline 失敗：%s", e)
-                answer = "抱歉，系統暫時無法回覆。"
             if reply_token:
                 line_reply(reply_token, answer)
     return {"ok": True}
@@ -704,25 +369,29 @@ async def _startup():
             log.info("PyTorch version %s available.", torch.__version__)
     except Exception:
         pass
     # 載入語料與索引
     STATE.sentences, STATE.meta = ensure_sentences_meta()
     STATE.emb_model = load_embedding_model(EMBEDDING_MODEL_ID)
     STATE.reranker_model = load_reranker_model(RERANKER_MODEL_ID)
     STATE.faiss_index = ensure_faiss(FAISS_INDEX, STATE.sentences)
     STATE.bm25 = ensure_bm25(BM25_PKL, STATE.sentences)
     for m in STATE.meta:
         sec = m.get("section", "其他")
         m["section"] = SECTION_NORMALIZE.get(sec, sec)
-    if os.path.exists(CSV_PATH):
-        STATE.df_csv = pd.read_csv(CSV_PATH, dtype=str)
-    log.info("LLM via LiteLLM: base=%s model=%s", str(LITELLM_BASE_URL), str(LM_MODEL))
-    log.info("Startup complete.")
-@app.get("/")
-async def health():
-    return {"status": "healthy"}
 if __name__ == "__main__":
     import uvicorn
-    port = int(os.getenv("PORT", "7860"))
-    uvicorn.run("app:app", host="0.0.0.0", port=port, log_level=LOG_LEVEL.lower(), reload=False)

 # ---------- Imports ----------
 import re, hmac, base64, hashlib, pickle, logging, time, json
 from typing import List, Dict, Any, Optional, Tuple, Union
+from functools import lru_cache
 import numpy as np
 import pandas as pd
     torch = None
 try:
+    import faiss # 僅用於檢查 faiss 是否安裝
+except Exception:
+    faiss = None
 try:
+    from sentence_transformers import SentenceTransformer
 except Exception:
     SentenceTransformer = None
 try:
+    from rank_bm25 import BM25Okapi
 except Exception:
     BM25Okapi = None
+from litellm import completion
+from fastapi import FastAPI, Request
+from pydantic import BaseModel
+from pydantic_settings import BaseSettings
+# ---------- Logging Setup ----------
+logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
+log = logging.getLogger(__name__)
+# ---------- Constants & Paths ----------
+CONFIG_PATH = os.path.join(os.path.dirname(__file__), ".env")
+SENTENCES_PKL = os.path.join(os.path.dirname(__file__), "drug_sentences.pkl")
+FAISS_INDEX = os.path.join(os.path.dirname(__file__), "drug_sentences.index")
+BM25_PKL = os.path.join(os.path.dirname(__file__), "bm25.pkl")
+CSV_PATH = os.path.join(os.path.dirname(__file__), "cleaned_combined.csv")
+# fallback to /tmp
+for p in (SENTENCES_PKL, FAISS_INDEX, BM25_PKL):
+    if not os.path.exists(p):
+        log.warning("File not found: %s, fallback to /tmp", p)
+        # 允許重建，但只寫到 /tmp
+        SENTENCES_PKL = os.path.join("/tmp", os.path.basename(SENTENCES_PKL))
+        FAISS_INDEX = os.path.join("/tmp", os.path.basename(FAISS_INDEX))
+        BM25_PKL = os.path.join("/tmp", os.path.basename(BM25_PKL))
+        break
+# https://docs.huggingface.co/huggingface_hub/package_reference/environment_variables#general-purpose
+# https://docs.sentence-transformers.com/en/latest/quickstart.html
+EMBEDDING_MODEL_ID = os.getenv("EMBEDDING_MODEL_ID", "AI-infinity/bge-m3-zh-tw")
+RERANKER_MODEL_ID = os.getenv("RERANKER_MODEL_ID", "AI-infinity/bge-reranker-base-zh-tw")
+LM_MODEL = os.getenv("LM_MODEL", "azure/gpt-4o")
 SECTION_NORMALIZE = {
+    '適應症': '適應症', '用法用量': '用法用量', '副作用': '副作用',
+    '禁忌': '禁忌', '警語注意事項': '警語及注意事項', '藥品外觀': '藥品外觀'
 }
+# ---------- State Management ----------
+class AppState:
+    def __init__(self):
+        self.sentences: List[str] = []
+        self.meta: List[Dict[str, Any]] = []
+        self.emb_model: Optional[SentenceTransformer] = None
+        self.reranker_model: Optional[SentenceTransformer] = None
+        self.faiss_index: Optional[faiss.Index] = None
+        self.bm25: Optional[BM25Okapi] = None
+        self.df_csv: Optional[pd.DataFrame] = None
+STATE = AppState()
+# ---------- Helper Functions (RAG pipeline) ----------
+def ensure_sentences_meta():
     if os.path.exists(SENTENCES_PKL):
+        log.info("Loading sentences from %s", SENTENCES_PKL)
+        with open(SENTENCES_PKL, "rb") as f:
+            sentences, meta = pickle.load(f)
+        return sentences, meta
+    if not os.path.exists(CSV_PATH):
+        log.error("CSV file not found: %s", CSV_PATH)
+        return [], []
+    df = pd.read_csv(CSV_PATH)
+    sentences = (df["section"] + "：" + df["content"]).tolist()
+    meta = df.to_dict(orient="records")
+    log.info("Building sentences from CSV (total=%d)", len(sentences))
+    with open(SENTENCES_PKL, "wb") as f:
+        pickle.dump((sentences, meta), f)
+    return sentences, meta
+@lru_cache(maxsize=1)
 def load_embedding_model(model_id: str):
     if SentenceTransformer is None:
+        log.error("SentenceTransformer not installed. Please install it.")
         return None
     try:
+        if torch is not None and torch.cuda.is_available():
+            log.info("Using GPU for embedding model: %s", model_id)
+            device = "cuda"
+        else:
+            log.info("Using CPU for embedding model: %s", model_id)
+            device = "cpu"
+        model = SentenceTransformer(model_id, device=device)
+        return model
     except Exception as e:
+        log.error("Failed to load embedding model: %s, error: %s", model_id, e)
         return None
+@lru_cache(maxsize=1)
 def load_reranker_model(model_id: str):
+    if SentenceTransformer is None:
+        log.error("SentenceTransformer not installed. Please install it.")
         return None
     try:
+        if torch is not None and torch.cuda.is_available():
+            log.info("Using GPU for reranker model: %s", model_id)
+            device = "cuda"
+        else:
+            log.info("Using CPU for reranker model: %s", model_id)
+            device = "cpu"
+        model = SentenceTransformer(model_id, device=device)
+        return model
     except Exception as e:
+        log.error("Failed to load reranker model: %s, error: %s", model_id, e)
         return None
+def ensure_faiss(index_path: str, sentences: List[str]):
+    if faiss is None:
+        log.error("FAISS not installed. Please install it.")
         return None
+    if os.path.exists(index_path):
+        log.info("Loading FAISS index from %s", index_path)
+        return faiss.read_index(index_path)
+    log.info("Building FAISS index (total=%d)", len(sentences))
+    embeddings = STATE.emb_model.encode(sentences, show_progress_bar=True)
+    index = faiss.IndexFlatL2(embeddings.shape[1])
+    index.add(embeddings)
+    faiss.write_index(index, index_path)
+    return index
+def ensure_bm25(bm25_path: str, sentences: List[str]):
+    if BM25Okapi is None:
+        log.error("BM25Okapi not installed. Please install it.")
+        return None
+    if os.path.exists(bm25_path):
+        log.info("Loading BM25 index from %s", bm25_path)
+        with open(bm25_path, 'rb') as f:
+            bm25 = pickle.load(f)
+        return bm25
+    log.info("Building BM25 index (total=%d)", len(sentences))
+    tokenized_corpus = [s.split(" ") for s in sentences]
+    bm25 = BM25Okapi(tokenized_corpus)
+    with open(bm25_path, 'wb') as f:
+        pickle.dump(bm25, f)
+    return bm25
+def retrieve_top_k_passages(query: str, k: int=10):
+    if STATE.emb_model is None or STATE.faiss_index is None or STATE.bm25 is None:
         return []
+    # FAISS retrieval
+    query_embedding = STATE.emb_model.encode([query])
+    _, faiss_indices = STATE.faiss_index.search(query_embedding, k)
+    faiss_passages = [STATE.sentences[i] for i in faiss_indices[0]]
+    # BM25 retrieval
+    bm25_scores = STATE.bm25.get_scores(query.split(" "))
+    bm25_indices = np.argsort(bm25_scores)[::-1][:k]
+    bm25_passages = [STATE.sentences[i] for i in bm25_indices]
+    # Combine and deduplicate
+    combined_passages = list(dict.fromkeys(faiss_passages + bm25_passages))
+    # Reranking
+    reranker_scores = STATE.reranker_model.rank(query, combined_passages)
+    # Sort and return top k
+    reranked_passages = [p for _, p in sorted(zip(reranker_scores, combined_passages), reverse=True)][:k]
+    return reranked_passages
+def generate_answer(query: str, passages: List[str]):
+    context = "\n".join(passages)
+    system_prompt = (
+        "你是一位專業藥師，請根據以下提供的藥品資訊內容，使用繁體中文簡潔且準確地回答問題。 "
+        "你的回覆應清楚、易懂，且只引用提供的內容。若提供的內容無法回答問題，請直接說「抱歉，我無法從現有資料中找到相關資訊。」"
+        "回答時請依據不同段落整理成條列式或分段式，並在回覆最後加上免責聲明「本資訊僅供參考，實際用藥請諮詢專業醫師或藥師。」。"
     )
+    user_prompt = f"問題: {query}\n\n藥品資訊:\n{context}\n\n回覆:"
     try:
+        response = completion(
             model=LM_MODEL,
+            messages=[
+                {"role": "system", "content": system_prompt},
+                {"role": "user", "content": user_prompt}
+            ],
+            temperature=0.0
         )
+        return response.choices[0].message.content
     except Exception as e:
+        log.error("LLM completion failed: %s", e)
+        return "抱歉，系統暫時無法回覆。請稍後再試。"
+# ---------- FastAPI App & Webhook Logic ----------
+class Settings(BaseSettings):
+    channel_access_token: str
+    channel_secret: str
+    class Config:
+        env_file = ".env"
+        env_file_encoding = "utf-8"
+try:
+    settings = Settings()
+except Exception as e:
+    log.error("Failed to load environment variables from .env: %s", e)
+    log.warning("Trying to load from system environment variables...")
+    settings = Settings(_env_file=None) # fall back to system env
+app = FastAPI()
+class LineEvent(BaseModel):
+    replyToken: str
+    message: Dict[str, str]
+class LineWebhook(BaseModel):
+    events: List[LineEvent]
+    destination: str
+def line_reply(reply_token: str, message: str):
+    import requests
     headers = {
+        "Content-Type": "application/json; charset=UTF-8",
+        "Authorization": f"Bearer {settings.channel_access_token}"
+    }
+    data = {
+        "replyToken": reply_token,
+        "messages": [{"type": "text", "text": message}]
     }
     try:
+        response = requests.post("https://api.line.me/v2/bot/message/reply", headers=headers, json=data, timeout=5)
+        response.raise_for_status()
+        log.info("LINE reply success: %s", response.status_code)
     except Exception as e:
+        log.error("LINE reply failed: %s", e)
+# 為了快速比對藥名，預先正規化
+# REVISED: 新增程式碼區塊
+if STATE.df_csv is not None:
+    STATE.df_csv['drug_name_norm_normalized'] = STATE.df_csv['drug_name_norm'].str.lower().str.replace(r'[^\w\s]', '', regex=True).str.strip()
 @app.post("/webhook")
+async def handle_webhook(webhook: LineWebhook, request: Request):
+    # 驗證簽章
+    signature = request.headers.get("x-line-signature")
+    if signature is None:
+        log.warning("Signature is missing.")
+        return {"ok": False}
+    body = (await request.body()).decode("utf-8")
+    hash_body = hmac.new(settings.channel_secret.encode('utf-8'), body.encode('utf-8'), hashlib.sha256).digest()
+    if not hmac.compare_digest(hash_body, base64.b64decode(signature)):
+        log.warning("Invalid signature.")
+        return {"ok": False}
+    for event in webhook.events:
+        reply_token = event.replyToken
+        msg_type = event.message.get("type")
+        if msg_type == "text":
+            user_text = event.message.get("text", "")
+            log.info("Received message: %s", user_text)
+            answer = "抱歉，系統暫時無法回覆。"
             try:
+                # REVISED: 優先處理單一藥名精確比對
+                if STATE.df_csv is not None:
+                    normalized_user_text = user_text.lower().replace(r'[^\w\s]', '').strip()
+                    # 檢查是否為單一藥名查詢
+                    matches = STATE.df_csv[STATE.df_csv['drug_name_norm_normalized'] == normalized_user_text]
+                    if not matches.empty:
+                        unique_drug_ids = matches['drug_id'].nunique()
+                        if unique_drug_ids == 1:
+                            log.info("Exact match found for single drug name: %s", user_text)
+                            # 獲取該藥品的所有資訊
+                            target_drug_id = matches['drug_id'].iloc[0]
+                            relevant_rows = STATE.df_csv[STATE.df_csv['drug_id'] == target_drug_id]
+                            # 組合所有相關段落內容
+                            combined_content = []
+                            for section in relevant_rows['section'].unique():
+                                section_content = "\n".join(relevant_rows[relevant_rows['section'] == section]['content'].tolist())
+                                combined_content.append(f"{section}：{section_content}")
+                            # 傳給 LLM 進行摘要與回覆生成
+                            passages_for_llm = combined_content
+                            answer = generate_answer(query=user_text, passages=passages_for_llm)
+                        # 不符合單一藥名比對條件，或有多個 drug_id，則走原本的 RAG 流程
+                        else:
+                            log.info("Multiple drugs or no exact match, falling back to RAG pipeline.")
+                            passages = retrieve_top_k_passages(user_text)
+                            answer = generate_answer(query=user_text, passages=passages)
+                    else:
+                        # 找不到精確匹配，走原本的 RAG 流程
+                        passages = retrieve_top_k_passages(user_text)
+                        answer = generate_answer(query=user_text, passages=passages)
+                else:
+                    # 如果 CSV 沒有載入，也走 RAG 流程
+                    passages = retrieve_top_k_passages(user_text)
+                    answer = generate_answer(query=user_text, passages=passages)
             except Exception as e:
                 log.warning("Pipeline 失敗：%s", e)
+                answer = "抱歉，系統暫時無法回覆。請稍後再試。"
             if reply_token:
                 line_reply(reply_token, answer)
     return {"ok": True}
             log.info("PyTorch version %s available.", torch.__version__)
     except Exception:
         pass
+    # 載入 CSV
+    if os.path.exists(CSV_PATH):
+        STATE.df_csv = pd.read_csv(CSV_PATH, dtype=str)
+        log.info("Loaded CSV: %s (rows=%d)", CSV_PATH, len(STATE.df_csv))
+    else:
+        log.warning("CSV not found: %s", CSV_PATH)
     # 載入語料與索引
     STATE.sentences, STATE.meta = ensure_sentences_meta()
     STATE.emb_model = load_embedding_model(EMBEDDING_MODEL_ID)
     STATE.reranker_model = load_reranker_model(RERANKER_MODEL_ID)
     STATE.faiss_index = ensure_faiss(FAISS_INDEX, STATE.sentences)
     STATE.bm25 = ensure_bm25(BM25_PKL, STATE.sentences)
     for m in STATE.meta:
         sec = m.get("section", "其他")
         m["section"] = SECTION_NORMALIZE.get(sec, sec)
+    log.info("LLM Model: %s", LM_MODEL)
+    log.info("===== Application Ready =====")
+# This is a sample code to test the API locally.
 if __name__ == "__main__":
     import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=8000)