Spaces:

dayuian
/

VocabLine

Running

App Files Files Community

dayuian committed 11 days ago

Commit

3ed2d28

verified ·

1 Parent(s): 4982f66

Update vocab.py

Browse files

Files changed (1) hide show

vocab.py +18 -57

vocab.py CHANGED Viewed

@@ -1,67 +1,28 @@
-import sqlite3
 import os
 import json
-import random
-from ai_sentence import generate_sentence
-from tqdm import tqdm
 DATA_DIR = "./data"
-DB_PATH = os.path.join(DATA_DIR, "sentences.db")
# Draw random words and attach an example sentence to each one, taken from the
# sentence database or, failing that, generated by a language model.
def _fetch_sentence_rows(word):
    """Return every ``(sentence, source, model)`` row stored for *word*."""
    from contextlib import closing

    # closing() releases the connection even when the query raises; the
    # sqlite3 connection's own context manager only commits or rolls back.
    with closing(sqlite3.connect(DB_PATH)) as conn:
        return conn.execute(
            'SELECT sentence, source, model FROM sentences WHERE word=?',
            (word,),
        ).fetchall()


def _save_generated_sentence(word, phonetic, sentence, model):
    """Insert or update the generated sentence for *word* with source "ai"."""
    from contextlib import closing

    with closing(sqlite3.connect(DB_PATH)) as conn:
        conn.execute(
            '''
            INSERT INTO sentences (word, phonetic, sentence, source, model)
            VALUES (?, ?, ?, ?, ?)
            ON CONFLICT(word, source, model) DO UPDATE SET sentence=excluded.sentence, phonetic=excluded.phonetic
            ''',
            (word, phonetic, sentence, "ai", model),
        )
        conn.commit()


def _render_entry(word, phonetic, sentence):
    """Return the HTML card for one word, with all dynamic text escaped."""
    import html

    # Sentences come from a database or a language model, so they must not be
    # trusted to be free of markup.
    safe_word = html.escape(str(word))
    safe_phonetic = html.escape(str(phonetic)) if phonetic else '無'
    safe_sentence = html.escape(str(sentence))
    return f"""
            <div style="margin-bottom: 10px; padding: 8px; border-left: 4px solid #4CAF50; background-color: #f9f9f9;">
                <strong>單字：</strong> {safe_word} <br>
                <strong>音標：</strong> {safe_phonetic} <br>
                <strong>句子：</strong> {safe_sentence}
            </div>
            """


def get_words_with_sentences(source, n):
    """Pick *n* random words from a source and pair each with a sentence.

    The word list is read from ``<DATA_DIR>/<source>.json``. For each sampled
    word the sentence database is queried; a row whose source is "tatoeba" is
    preferred, otherwise the first row is used. When no row exists, a sentence
    is generated with ``generate_sentence`` and written back to the database.

    Args:
        source: Name of the word list, without the ``.json`` extension.
        n: Number of words to sample.

    Returns:
        tuple[str, str]: ``(html, status)``. On success ``html`` holds one
        card per word. On any failure both elements carry the error text
        instead; no exception is propagated to the caller.
    """
    import html

    model_name = "EleutherAI/pythia-410m"
    try:
        # Load every entry of the selected word list.
        with open(os.path.join(DATA_DIR, f"{source}.json"), 'r', encoding='utf-8') as f:
            words = json.load(f)

        # random.sample raises ValueError when n exceeds the list size; that
        # is reported through the error branch below.
        selected_words = random.sample(words, n)

        cards = []
        for word_data in tqdm(selected_words, desc="處理單字"):
            word = word_data['word']
            # A missing phonetic should not abort the whole batch.
            phonetic = word_data.get('phonetic')

            rows = _fetch_sentence_rows(word)
            if rows:
                # Prefer the first Tatoeba sentence; fall back to the first row.
                tatoeba = next((row[0] for row in rows if row[1] == "tatoeba"), "")
                sentence = tatoeba or rows[0][0]
            else:
                # Nothing stored yet: generate a sentence and cache it.
                sentence = generate_sentence(word, model_name)
                _save_generated_sentence(word, phonetic, sentence, model_name)

            cards.append(_render_entry(word, phonetic, sentence))

        return "".join(cards), "✅ 抽單字 & 生成完成"
    except Exception as e:
        # Deliberately broad: the caller receives displayable text, not a traceback.
        return f"<p style='color:red;'>❌ 發生錯誤：{html.escape(str(e))}</p>", f"❌ 錯誤：{str(e)}"

 import os
 import json
 DATA_DIR = "./data"
# List the names of the available vocabulary sources.
def get_sources():
    """Return the vocabulary source names found in ``DATA_DIR``.

    A source is any directory entry whose name ends in ``.json``; the name is
    reported without that extension.

    Returns:
        list[str]: Source names in sorted order.

    Raises:
        OSError: Propagated from ``os.listdir`` when ``DATA_DIR`` cannot be
            listed.
    """
    suffix = ".json"
    # Trim only the trailing extension: splitting on ".json" would cut a name
    # such as "x.json.bak.json" down to "x".
    # os.listdir() returns entries in arbitrary order, so sort for a stable list.
    return sorted(
        name[:-len(suffix)]
        for name in os.listdir(DATA_DIR)
        if name.endswith(suffix)
    )
# Load every entry of one vocabulary source (the whole parsed list is returned).
def get_words_from_source(source):
    """Read ``<DATA_DIR>/<source>.json`` and return its parsed contents.

    Args:
        source: Source name without the ``.json`` extension.

    Returns:
        The object produced by ``json.load`` for that file.

    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If the file is not valid JSON.
    """
    json_file = os.path.join(DATA_DIR, "{}.json".format(source))
    with open(json_file, encoding='utf-8') as handle:
        return json.load(handle)
# Look up the details (phonetic, etc.) of a single word.
def get_word_info(source, word):
    """Return the first entry in *source* whose ``'word'`` equals *word*.

    Args:
        source: Source name, passed on to ``get_words_from_source``.
        word: The word to look for (exact match).

    Returns:
        The matching entry, e.g. ``{'id': 1, 'word': 'apple', 'phonetic': '...'}``,
        or ``None`` when the word is not present.
    """
    candidates = get_words_from_source(source)
    # next() stops at the first match and yields None when there is none.
    return next((item for item in candidates if item['word'] == word), None)