Spaces:

Andy0830
/

SYSTEM

Running

App Files Community

Andy0830 committed 5 days ago

Commit

8c3f3bc

verified ·

1 Parent(s): 0ed4edb

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -7

app.py CHANGED Viewed

@@ -12,18 +12,19 @@ SYSTEM_TITLE = "花蓮慈濟醫院公文輔助判決系統"
 FILE_PATH = 'data.csv'
 INDEX_FILE = 'corpus_embeddings.pt'
-# ▼▼▼ 設定登入帳號密碼 (您可以修改這裡) ▼▼▼
 # 格式：("帳號", "密碼")
-LOGIN_DATA = ("admin", "1234")
 # --- 1. 讀取資料 ---
-print("🚀 正在啟動快取模式...")
 if not os.path.exists(FILE_PATH):
     print(f"❌ 錯誤：找不到 {FILE_PATH}")
     sys.exit(1)
 try:
     df = pd.read_csv(FILE_PATH, encoding='cp950')
 except UnicodeDecodeError:
     try:
@@ -35,11 +36,15 @@ except Exception:
 # --- 2. 資料清洗 ---
 if not df.empty:
     df.columns = [str(c).strip().replace('\ufeff', '') for c in df.columns]
     for col in df.columns:
         if '主旨' in col or '內容' in col: df.rename(columns={col: '主旨'}, inplace=True)
         if '窗口' in col or '單位' in col: df.rename(columns={col: '收文窗口'}, inplace=True)
     df['主旨'] = df['主旨'].astype(str)
     df['收文窗口'] = df['收文窗口'].astype(str)
     df = df.dropna(subset=['主旨', '收文窗口'])
@@ -63,6 +68,7 @@ except Exception as e:
 corpus_embeddings = None
 if total_records > 0 and model is not None:
     if os.path.exists(INDEX_FILE):
         print(f"⚡ 偵測到快取檔案，正在秒速載入...")
         try:
@@ -72,8 +78,9 @@ if total_records > 0 and model is not None:
             print(f"❌ 快取檔案損壞，將重新計算。錯誤: {e}")
             corpus_embeddings = None
     if corpus_embeddings is None:
-        print(f"🔥 開始計算索引 (需時約 2-4 分鐘)...")
         chunk_size = 500
         embeddings_chunks = []
@@ -86,6 +93,7 @@ if total_records > 0 and model is not None:
                 gc.collect()
             corpus_embeddings = torch.cat(embeddings_chunks)
             torch.save(corpus_embeddings, INDEX_FILE)
             print("✅ 索引計算並儲存完成！")
@@ -96,7 +104,7 @@ if total_records > 0 and model is not None:
 # --- 4. 定義搜尋 ---
 def search_department(query):
     if corpus_embeddings is None:
-        return "⚠️ 系統初始化失敗。"
     if not query.strip():
         return "請輸入公文主旨..."
@@ -126,7 +134,7 @@ def search_department(query):
     return output_text
-# --- 5. 介面 (包含密碼鎖) ---
 iface = gr.Interface(
     fn=search_department,
     inputs=gr.Textbox(lines=3, placeholder="請輸入公文主旨..."),
@@ -137,5 +145,5 @@ iface = gr.Interface(
 )
 if __name__ == "__main__":
-    # ▼▼▼ 這裡加上了 auth 參數，啟動時會要求輸入帳號密碼 ▼▼▼
     iface.launch(auth=LOGIN_DATA)

 FILE_PATH = 'data.csv'
 INDEX_FILE = 'corpus_embeddings.pt'
+# ▼▼▼ 設定登入帳號密碼 (已更新) ▼▼▼
 # 格式：("帳號", "密碼")
+LOGIN_DATA = ("admin", "htch15583")
 # --- 1. 讀取資料 ---
+print("🚀 正在啟動系統...")
 if not os.path.exists(FILE_PATH):
     print(f"❌ 錯誤：找不到 {FILE_PATH}")
     sys.exit(1)
 try:
+    # 讀取檔案 (CP950 優先)
     df = pd.read_csv(FILE_PATH, encoding='cp950')
 except UnicodeDecodeError:
     try:
 # --- 2. 資料清洗 ---
 if not df.empty:
+    # 移除 BOM 與空白
     df.columns = [str(c).strip().replace('\ufeff', '') for c in df.columns]
+    # 自動對應欄位
     for col in df.columns:
         if '主旨' in col or '內容' in col: df.rename(columns={col: '主旨'}, inplace=True)
         if '窗口' in col or '單位' in col: df.rename(columns={col: '收文窗口'}, inplace=True)
+    # 轉字串 & 移除空值
     df['主旨'] = df['主旨'].astype(str)
     df['收文窗口'] = df['收文窗口'].astype(str)
     df = df.dropna(subset=['主旨', '收文窗口'])
 corpus_embeddings = None
 if total_records > 0 and model is not None:
+    # 檢查是否有快取檔案
     if os.path.exists(INDEX_FILE):
         print(f"⚡ 偵測到快取檔案，正在秒速載入...")
         try:
             print(f"❌ 快取檔案損壞，將重新計算。錯誤: {e}")
             corpus_embeddings = None
+    # 如果沒有快取，則進行計算
     if corpus_embeddings is None:
+        print(f"🔥 開始計算索引 (需時約 2-4 分鐘，請耐心等候)...")
         chunk_size = 500
         embeddings_chunks = []
                 gc.collect()
             corpus_embeddings = torch.cat(embeddings_chunks)
+            # 儲存到硬碟，下次啟動就會很快
             torch.save(corpus_embeddings, INDEX_FILE)
             print("✅ 索引計算並儲存完成！")
 # --- 4. 定義搜尋 ---
 def search_department(query):
     if corpus_embeddings is None:
+        return "⚠️ 系統初始化失敗，請檢查 Logs。"
     if not query.strip():
         return "請輸入公文主旨..."
     return output_text
+# --- 5. 介面 (已啟用密碼鎖) ---
 iface = gr.Interface(
     fn=search_department,
     inputs=gr.Textbox(lines=3, placeholder="請輸入公文主旨..."),
 )
 if __name__ == "__main__":
+    # 啟動時加入驗證
     iface.launch(auth=LOGIN_DATA)