Spaces:

dayuian
/

VocabLine

Running

App Files Community

dayuian committed on Feb 18

Commit

2a9478d

verified ·

1 Parent(s): e7b5b55

Update app.py

Browse files

Files changed (1) hide show

app.py +55 -76

app.py CHANGED Viewed

@@ -1,79 +1,58 @@
 import gradio as gr
-import json
-import random
-from transformers import AutoModelForCausalLM, AutoTokenizer
-import os
-import re
-# 模型初始化
-model_name = "EleutherAI/pythia-410m"
-tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForCausalLM.from_pretrained(model_name)
-# 資料夾
-DATA_DIR = "./data"
-# 自動掃描資料夾生成選單
-def get_sources():
-    files = os.listdir(DATA_DIR)
-    sources = [f.split(".json")[0] for f in files if f.endswith(".json")]
-    return sources
-# 清理 GPT 生成句子的雜訊
-def clean_sentence(output):
-    output = re.sub(r"Write.*?beginners\.", "", output, flags=re.IGNORECASE).strip()
-    output = re.sub(r"\*\*?\d+\.*\*\*", "", output).strip()
-    if not output.endswith("."):
-        output += "."
-    return output
-# 核心函數
-def get_words_with_sentences(source, n):
-    status = []
-    try:
-        data_path = os.path.join(DATA_DIR, f"{source}.json")
-        with open(data_path, 'r', encoding='utf-8') as f:
-            words = json.load(f)
-        selected_words = random.sample(words, n)
-        results = []
-        for i, word_data in enumerate(selected_words):
-            status.append(f"正在生成第 {i+1}/{n} 個單字 [{word_data['word']}] 例句...")
-            word = word_data['word']
-            prompt = f"Use the word '{word}' in a simple English sentence suitable for beginners. Output only the sentence."
-            inputs = tokenizer(prompt, return_tensors="pt")
-            outputs = model.generate(**inputs, max_new_tokens=30)
-            sentence = tokenizer.decode(outputs[0], skip_special_tokens=True)
-            clean_output = clean_sentence(sentence)
-            results.append({
-                "word": word,
-                "phonetic": word_data["phonetic"],
-                "sentence": clean_output
-            })
-        status.append("✅ 完成！")
-        return results, status
-    except Exception as e:
-        status.append(f"❌ 發生錯誤: {str(e)}")
-        return [], status
-# Gradio 介面
-demo = gr.Interface(
-    fn=get_words_with_sentences,
-    inputs=[
-        gr.Dropdown(choices=get_sources(), value="common3000", label="選擇單字庫", interactive=True, show_clear_button=False),
-        gr.Number(value=10, label="抽幾個單字")
-    ],
-    outputs=[
-        gr.JSON(label="生成結果"),
-        gr.JSON(label="生成進度")
-    ]
-)
 demo.launch()

 import gradio as gr
+from vocab import get_sources, get_words_with_sentences
+with gr.Blocks() as demo:
+    gr.Markdown(
+        """
+        # 📖 英文單字隨機抽取 & GPT 例句生成 API
+        ## 📝 專案簡介
+        本專案提供一個 API 服務，能夠從不同的單字庫隨機抽取單字，並使用開源語言模型自動生成例句。
+        適合作為 LINE 單字推播、自學工具、英文教學輔助等用途。
+        ## ⚙️ 主要功能
+        - 支援從多個單字庫中選擇，如：`common3000`, `business_words`。
+        - 可自訂抽取單字數量。
+        - 每個單字自動生成一個簡單的英文例句，適合初學者學習。
+        ## 📚 使用方式
+        1. 選擇單字庫（例如：`common3000`）。
+        2. 設定抽取單字數量（例如：10個）。
+        3. 點擊「生成例句」按鈕，即可獲得單字 + 音標 + 例句。
+        ## 🗂️ 資料來源
+        - **common3000**：常用3000單字表，附音標。
+        - 未來可能會有更多單字庫新增至 `/data/` 資料夾。（可能啦！
+        ## 🛠️ 技術架構
+        - **Gradio Blocks** 前端介面 + API。
+        - **Hugging Face Transformers** 語言模型：
+            - 模型：`EleutherAI/pythia-410m`（小型 GPT 模型）
+        ## 👨‍💻 開發者資訊
+        - 開發者：余彦志 (大宇 ian)
+        - 信箱：dayuian@hotmail.com
+        - GitHub：[https://github.com/dayuian](https://github.com/dayuian)
+        """
+    )
+    source_dropdown = gr.Dropdown(
+        choices=get_sources(),
+        value="common3000",
+        label="選擇單字庫",
+        interactive=True
+    )
+    num_input = gr.Number(value=10, label="抽幾個單字")
+    result_output = gr.HTML(label="生成結果")
+    status_output = gr.Textbox(label="狀態更新", lines=8, interactive=False)
+    submit_btn = gr.Button("生成例句")
+    submit_btn.click(
+        fn=get_words_with_sentences,
+        inputs=[source_dropdown, num_input],
+        outputs=[result_output, status_output]
+    )
 demo.launch()