Spaces:

Andy0830
/

SYSTEM

Running

App Files Community

Andy0830 committed 13 days ago

Commit

0ed4edb

verified ·

1 Parent(s): ef488f7

Update app.py

Browse files

Files changed (1) hide show

app.py +18 -25

app.py CHANGED Viewed

@@ -10,9 +10,12 @@ import time
 # --- 系統設定 ---
 SYSTEM_TITLE = "花蓮慈濟醫院公文輔助判決系統"
 FILE_PATH = 'data.csv'
-# ▼▼▼ 關鍵：定義索引檔案儲存路徑 ▼▼▼
 INDEX_FILE = 'corpus_embeddings.pt'
 # --- 1. 讀取資料 ---
 print("🚀 正在啟動快取模式...")
@@ -21,7 +24,6 @@ if not os.path.exists(FILE_PATH):
     sys.exit(1)
 try:
-    # 讀取檔案 (維持 CP950 容錯)
     df = pd.read_csv(FILE_PATH, encoding='cp950')
 except UnicodeDecodeError:
     try:
@@ -50,9 +52,7 @@ else:
     corpus = []
     total_records = 0
-# --- 3. 載入模型與建立索引 (關鍵：檢查快取) ---
-# 檢查模型是否已經載入
 model = None
 try:
     print("🧠 正在載入模型 (BAAI/bge-small-zh-v1.5)...")
@@ -64,21 +64,18 @@ corpus_embeddings = None
 if total_records > 0 and model is not None:
     if os.path.exists(INDEX_FILE):
-        # 快取存在，直接載入，快速啟動！
-        print(f"⚡ 偵測到快取檔案 ({INDEX_FILE})，正在秒速載入...")
         try:
             corpus_embeddings = torch.load(INDEX_FILE)
-            print("✅ 索引載入完成，系統秒速啟動！")
         except Exception as e:
-            print(f"❌ 快取檔案損壞，將重新計算索引。錯誤: {e}")
-            corpus_embeddings = None # 設為 None 重新計算
     if corpus_embeddings is None:
-        # 第一次啟動或快取損壞，進行耗時的計算
-        print(f"🔥 第一次啟動或快取失效，開始分批計算索引 (這需要約 2-4 分鐘)...")
         chunk_size = 500
         embeddings_chunks = []
-        start_time = time.time()
         try:
             for i in range(0, total_records, chunk_size):
@@ -88,23 +85,18 @@ if total_records > 0 and model is not None:
                 print(f"   -> 已處理 {min(i + chunk_size, total_records)} / {total_records} 筆...")
                 gc.collect()
-            # 合併與儲存
-            print("🔗 正在合併並儲存索引...")
             corpus_embeddings = torch.cat(embeddings_chunks)
-            torch.save(corpus_embeddings, INDEX_FILE) # ▼▼▼ 儲存索引到硬碟 ▼▼▼
-            end_time = time.time()
-            print(f"✅ 全量索引計算並儲存完成！耗時 {int(end_time - start_time)} 秒。")
         except Exception as e:
-            print(f"❌ 索引計算失敗 (可能記憶體不足): {e}")
             corpus_embeddings = None
 # --- 4. 定義搜尋 ---
 def search_department(query):
-    # 這裡的邏輯與之前相同，不需要修改
     if corpus_embeddings is None:
-        return "⚠️ 系統初始化失敗，請檢查 Logs。"
     if not query.strip():
         return "請輸入公文主旨..."
@@ -134,15 +126,16 @@ def search_department(query):
     return output_text
-# --- 5. 介面 ---
 iface = gr.Interface(
     fn=search_department,
     inputs=gr.Textbox(lines=3, placeholder="請輸入公文主旨..."),
     outputs=gr.Textbox(lines=12, label="AI 判決建議"),
     title=SYSTEM_TITLE,
-    description=f"系統狀態：{'🟢 快取就緒' if corpus_embeddings is not None else '🔴 索引失敗'}\n資料庫完整收錄：{total_records} 筆歷史資料 (無刪減)",
     examples=[["檢送本署彙整人工生殖機構之捐贈生殖細胞使用情形"], ["函轉衛生局關於流感疫苗接種計畫"]]
 )
 if __name__ == "__main__":
-    iface.launch()

 # --- 系統設定 ---
 SYSTEM_TITLE = "花蓮慈濟醫院公文輔助判決系統"
 FILE_PATH = 'data.csv'
 INDEX_FILE = 'corpus_embeddings.pt'
+# ▼▼▼ 設定登入帳號密碼 (您可以修改這裡) ▼▼▼
+# 格式：("帳號", "密碼")
+LOGIN_DATA = ("admin", "1234")
 # --- 1. 讀取資料 ---
 print("🚀 正在啟動快取模式...")
     sys.exit(1)
 try:
     df = pd.read_csv(FILE_PATH, encoding='cp950')
 except UnicodeDecodeError:
     try:
     corpus = []
     total_records = 0
+# --- 3. 載入模型與建立索引 ---
 model = None
 try:
     print("🧠 正在載入模型 (BAAI/bge-small-zh-v1.5)...")
 if total_records > 0 and model is not None:
     if os.path.exists(INDEX_FILE):
+        print(f"⚡ 偵測到快取檔案，正在秒速載入...")
         try:
             corpus_embeddings = torch.load(INDEX_FILE)
+            print("✅ 索引載入完成！")
         except Exception as e:
+            print(f"❌ 快取檔案損壞，將重新計算。錯誤: {e}")
+            corpus_embeddings = None
     if corpus_embeddings is None:
+        print(f"🔥 開始計算索引 (需時約 2-4 分鐘)...")
         chunk_size = 500
         embeddings_chunks = []
         try:
             for i in range(0, total_records, chunk_size):
                 print(f"   -> 已處理 {min(i + chunk_size, total_records)} / {total_records} 筆...")
                 gc.collect()
             corpus_embeddings = torch.cat(embeddings_chunks)
+            torch.save(corpus_embeddings, INDEX_FILE)
+            print("✅ 索引計算並儲存完成！")
         except Exception as e:
+            print(f"❌ 索引計算失敗: {e}")
             corpus_embeddings = None
 # --- 4. 定義搜尋 ---
 def search_department(query):
     if corpus_embeddings is None:
+        return "⚠️ 系統初始化失敗。"
     if not query.strip():
         return "請輸入公文主旨..."
     return output_text
+# --- 5. 介面 (包含密碼鎖) ---
 iface = gr.Interface(
     fn=search_department,
     inputs=gr.Textbox(lines=3, placeholder="請輸入公文主旨..."),
     outputs=gr.Textbox(lines=12, label="AI 判決建議"),
     title=SYSTEM_TITLE,
+    description=f"系統狀態：{'🟢 系統正常' if corpus_embeddings is not None else '🔴 異常'}\n資料庫收錄：{total_records} 筆歷史資料",
     examples=[["檢送本署彙整人工生殖機構之捐贈生殖細胞使用情形"], ["函轉衛生局關於流感疫苗接種計畫"]]
 )
 if __name__ == "__main__":
+    # ▼▼▼ 這裡加上了 auth 參數，啟動時會要求輸入帳號密碼 ▼▼▼
+    iface.launch(auth=LOGIN_DATA)