Spaces:

Hieucyber2208
/

know-flow

Running

App Files Files Community

Hieucyber2208 committed on Feb 24

Commit

a0510b2

verified ·

1 Parent(s): 68e252e

Delete notebook

Browse files

Files changed (4) hide show

notebook/image_gen.ipynb +0 -190
notebook/text_preprocessing.ipynb +0 -247
notebook/text_to_speech.ipynb +0 -224
notebook/text_to_video.ipynb +0 -0

notebook/image_gen.ipynb DELETED Viewed

@@ -1,190 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from huggingface_hub import InferenceClient\n",
-    "import os\n",
-    "import glob\n",
-    "from collections import defaultdict\n",
-    "import google.generativeai as genai\n",
-    "from tqdm import tqdm\n",
-    "from huggingface_hub.utils import HfHubHTTPError\n",
-    "import random\n",
-    "from dotenv import load_dotenv\n",
-    "import time\n",
-    "\n",
-    "\n",
-    "# Load environment variables from .env and read the two API keys.\n",
-    "load_dotenv()\n",
-    "HF_API_KEY = os.getenv(\"HUGGINGFACE_API_KEY\")\n",
-    "GOOGLE_API_KEY = os.getenv(\"GOOGLE_API_KEY\")\n",
-    "\n",
-    "# Warn right away: a missing key otherwise only shows up later as an opaque API error.\n",
-    "for _key_name, _key_value in ((\"HUGGINGFACE_API_KEY\", HF_API_KEY), (\"GOOGLE_API_KEY\", GOOGLE_API_KEY)):\n",
-    "    if not _key_value:\n",
-    "        print(f\"Cảnh báo: chưa thiết lập biến môi trường {_key_name}.\")\n",
-    "\n",
-    "genai.configure(api_key=GOOGLE_API_KEY)\n",
-    "client = InferenceClient(provider=\"hf-inference\", api_key=HF_API_KEY)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def split_text_by_semantics(number_of_images):\n",
-    "    \"\"\"Split the stored text into labelled parts with Gemini and return the parts.\n",
-    "\n",
-    "    Reads ../data/text/text.txt, asks the model for `number_of_images` parts\n",
-    "    formatted as \"- Phần N: ...\" and parses the reply.\n",
-    "\n",
-    "    Args:\n",
-    "        number_of_images (int): Number of parts requested in the prompt.\n",
-    "\n",
-    "    Returns:\n",
-    "        list[str]: Part contents without the \"Phần N:\" label, or [] if the API call fails.\n",
-    "    \"\"\"\n",
-    "    import re  # local import keeps this cell independent of the import cell\n",
-    "\n",
-    "    with open(\"../data/text/text.txt\", \"r\", encoding=\"utf-8\") as file:\n",
-    "        text = file.read()\n",
-    "\n",
-    "    # Show one example line per requested part, so the example agrees with the requested count.\n",
-    "    format_lines = \"\\n\".join(\n",
-    "        f\"    - Phần {part_number}: [Nội dung]\" for part_number in range(1, number_of_images + 1)\n",
-    "    )\n",
-    "    prompt = f\"\"\"\n",
-    "    Bạn là một chuyên gia xử lý văn bản. Hãy chia văn bản sau thành {number_of_images} đoạn có ý nghĩa sao cho mỗi đoạn vừa đủ để giải thích trong khoảng 3 đến 5 câu.\n",
-    "\n",
-    "    Văn bản:\n",
-    "    {text}\n",
-    "\n",
-    "    Định dạng đầu ra:\n",
-    "{format_lines}\n",
-    "    \"\"\"\n",
-    "\n",
-    "    try:\n",
-    "        model = genai.GenerativeModel(\"gemini-pro\")\n",
-    "        response = model.generate_content(prompt)\n",
-    "        result_text = response.text.strip()\n",
-    "\n",
-    "        # Split on \"Phần N:\" markers at the start of a line, tolerating a bullet and bold markup,\n",
-    "        # so the label itself does not end up inside the chunk.\n",
-    "        pieces = re.split(r\"(?m)^\\s*(?:[-*•]\\s*)?\\**Phần\\s+\\d+\\**\\s*[:.]\\**\\s*\", result_text)\n",
-    "        if len(pieces) > 1:\n",
-    "            pieces = pieces[1:]  # text before the first marker is preamble, not a part\n",
-    "        return [piece.strip() for piece in pieces if piece.strip()]\n",
-    "    except Exception as e:\n",
-    "        print(f\"Lỗi khi gọi API Gemini: {e}\")\n",
-    "        return []"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def describe_image(description, detail_level=\"short\", perspective=\"neutral\", emotion=None, time_setting=None, art_style=None):\n",
-    "    \"\"\"\n",
-    "    Turn a detailed passage into an English image description via Gemini.\n",
-    "\n",
-    "    Args:\n",
-    "        description (str): Detailed passage to describe.\n",
-    "        detail_level (str): \"short\" for a concise result; any other value asks for a detailed one.\n",
-    "        perspective (str): \"subjective\" for a subjective view; any other value asks for a neutral one.\n",
-    "        emotion (str, optional): Dominant emotion, e.g. \"mysterious\", \"romantic\".\n",
-    "        time_setting (str, optional): Time period, e.g. \"modern\", \"medieval\", \"futuristic\".\n",
-    "        art_style (str, optional): Art style, e.g. \"realistic\", \"abstract\", \"sketch\".\n",
-    "\n",
-    "    Returns:\n",
-    "        str: The stripped model reply, or \"\" if the API call fails.\n",
-    "    \"\"\"\n",
-    "    # Resolve each criterion first; the template below only interpolates the results.\n",
-    "    detail_label = \"Ngắn gọn\" if detail_level == \"short\" else \"Chi tiết\"\n",
-    "    perspective_label = \"Chủ quan\" if perspective == \"subjective\" else \"Trung lập\"\n",
-    "    emotion_line = f\"- Cảm xúc chủ đạo: {emotion}.\" if emotion else \"\"\n",
-    "    time_line = f\"- Bối cảnh thời gian: {time_setting}.\" if time_setting else \"\"\n",
-    "    style_line = f\"- Phong cách nghệ thuật: {art_style}.\" if art_style else \"\"\n",
-    "\n",
-    "    prompt = f\"\"\"\n",
-    "    Bạn là chuyên gia mô tả hình ảnh. Hãy đọc đoạn mô tả dưới đây và tạo một mô tả hình ảnh theo các tiêu chí sau:\n",
-    "    - Mức độ chi tiết: {detail_label}.\n",
-    "    - Góc nhìn: {perspective_label}.\n",
-    "    {emotion_line}\n",
-    "    {time_line}\n",
-    "    {style_line}\n",
-    "\n",
-    "    Đoạn mô tả:\n",
-    "    {description}\n",
-    "\n",
-    "    Hãy tạo một mô tả hình ảnh phù hợp với yêu cầu trên bằng Tiếng Anh.\n",
-    "    \"\"\"\n",
-    "\n",
-    "    try:\n",
-    "        reply = genai.GenerativeModel(\"gemini-pro\").generate_content(prompt)\n",
-    "        return reply.text.strip()\n",
-    "    except Exception as e:\n",
-    "        print(f\"Lỗi khi gọi API Gemini: {e}\")\n",
-    "        return \"\"\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def generate_image(prompt, output_path, model=\"stabilityai/stable-diffusion-3.5-large\", resolution=(512, 512), style=None, color_palette=None):\n",
-    "    \"\"\"\n",
-    "    Generate an image from a text prompt and save it to disk.\n",
-    "\n",
-    "    :param prompt: Text description of the image.\n",
-    "    :param output_path: Path the generated image is saved to.\n",
-    "    :param model: Model id passed to the inference client.\n",
-    "    :param resolution: Requested size in pixels, interpreted as (width, height).\n",
-    "    :param style: Optional style appended to the prompt (e.g. 'realistic', 'anime', 'cyberpunk').\n",
-    "    :param color_palette: Optional colour scheme appended to the prompt (e.g. 'vibrant', 'monochrome').\n",
-    "    \"\"\"\n",
-    "    custom_prompt = prompt\n",
-    "\n",
-    "    if style:\n",
-    "        custom_prompt += f\" in {style} style\"\n",
-    "    if color_palette:\n",
-    "        custom_prompt += f\" with {color_palette} color scheme\"\n",
-    "\n",
-    "    # text_to_image takes the size as separate width/height arguments, not as `resolution`.\n",
-    "    width, height = resolution\n",
-    "    image = client.text_to_image(custom_prompt, model=model, width=width, height=height)\n",
-    "\n",
-    "    # Create the target folder on first use so save() does not fail when it is missing.\n",
-    "    output_dir = os.path.dirname(output_path)\n",
-    "    if output_dir:\n",
-    "        os.makedirs(output_dir, exist_ok=True)\n",
-    "    image.save(output_path)\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "MAX_RETRIES = 5        # attempts per image before giving up\n",
-    "COOLDOWN_SECONDS = 60  # pause after each successful generation\n",
-    "\n",
-    "texts = split_text_by_semantics(number_of_images=3)\n",
-    "for index, merged_text in enumerate(tqdm(texts, desc=\"Processing\", unit=\"image\")):\n",
-    "    output_path = f\"../data/image/{index}.png\"\n",
-    "    prompt = describe_image(merged_text)\n",
-    "    print(prompt)\n",
-    "\n",
-    "    # describe_image returns \"\" on failure; do not send an empty prompt to the image model.\n",
-    "    if not prompt:\n",
-    "        print(f\"Bỏ qua ảnh {index}: không có mô tả để tạo ảnh.\")\n",
-    "        continue\n",
-    "\n",
-    "    # Retry with exponential backoff plus jitter\n",
-    "    for attempt in range(1, MAX_RETRIES + 1):\n",
-    "        try:\n",
-    "            generate_image(prompt, output_path)\n",
-    "            time.sleep(COOLDOWN_SECONDS)  # wait after a successful generation\n",
-    "            break  # success: leave the retry loop\n",
-    "        except HfHubHTTPError as e:\n",
-    "            print(f\"Lỗi khi gọi API: {e}\")\n",
-    "            wait_time = 2 ** attempt + random.uniform(0, 1)  # exponential backoff\n",
-    "            print(f\"Thử lại sau {wait_time:.2f} giây...\")\n",
-    "            time.sleep(wait_time)\n",
-    "    else:\n",
-    "        # Runs only when every attempt failed, so the missing image is reported.\n",
-    "        print(f\"Không tạo được ảnh {index} sau {MAX_RETRIES} lần thử.\")"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "base",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.12.7"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}

notebook/text_preprocessing.ipynb DELETED Viewed

@@ -1,247 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Cài đặt thư viện\n",
-    "API Free của Gemini nên không cần private"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 1,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "import fitz  # PyMuPDF\n",
-    "from docx import Document\n",
-    "import google.generativeai as genai\n",
-    "from dotenv import load_dotenv\n",
-    "\n",
-    "# Load biến môi trường từ .env\n",
-    "load_dotenv()\n",
-    "GOOGLE_API_KEY = os.getenv(\"GOOGLE_API_KEY\")\n",
-    "genai.configure(api_key=GOOGLE_API_KEY)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Thiết lập hàm đọc file\n",
-    "Chấp nhận hai định dạng là .docx và .pdf. Đảm bảo file bài giảng nhiều chữ."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 2,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def extract_text_from_pdf(pdf_path):\n",
-    "    \"\"\"Return the concatenated text of every page of the PDF at `pdf_path`.\"\"\"\n",
-    "    # The context manager closes the document even if reading a page raises.\n",
-    "    with fitz.open(pdf_path) as doc:\n",
-    "        return \"\".join(\n",
-    "            doc.load_page(page_num).get_text() for page_num in range(doc.page_count)\n",
-    "        )\n",
-    "\n",
-    "def extract_text_from_docx(docx_path):\n",
-    "    \"\"\"Return the text of the DOCX at `docx_path`, each paragraph followed by a newline.\"\"\"\n",
-    "    paragraphs = Document(docx_path).paragraphs\n",
-    "    return \"\".join(paragraph.text + \"\\n\" for paragraph in paragraphs)\n",
-    "\n",
-    "def extract_text_from_file(file_path):\n",
-    "    \"\"\"Extract text from a PDF or DOCX file, chosen by its extension (case-insensitive).\n",
-    "\n",
-    "    Raises:\n",
-    "        ValueError: If the extension is neither .pdf nor .docx.\n",
-    "    \"\"\"\n",
-    "    _, extension = os.path.splitext(file_path)\n",
-    "    extension = extension.lower()\n",
-    "\n",
-    "    # Guard clauses: hand off to the matching reader, otherwise reject the file.\n",
-    "    if extension == '.pdf':\n",
-    "        return extract_text_from_pdf(file_path)\n",
-    "    if extension == '.docx':\n",
-    "        return extract_text_from_docx(file_path)\n",
-    "    raise ValueError(\"Unsupported file format. Only PDF and DOCX are supported.\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 4,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract the sample document and store its raw text for the following steps.\n",
-    "text = extract_text_from_file(\"../data/input/sample.pdf\")\n",
-    "with open(\"../data/text/text.txt\", mode=\"w\", encoding=\"utf-8\") as text_out:\n",
-    "    text_out.write(text)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Gọi API tiến hành chia đoạn và phân tích tóm tắt\n",
-    "Đưa ra phân tích và lưu lại file"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def split_text_by_semantics(text, number_of_chunks):\n",
-    "    \"\"\"Split `text` into labelled parts with Gemini and return the parts.\n",
-    "\n",
-    "    The model is asked for `number_of_chunks` parts formatted as \"- Phần N: ...\",\n",
-    "    and the reply is parsed on those markers.\n",
-    "\n",
-    "    Args:\n",
-    "        text (str): Text to split.\n",
-    "        number_of_chunks (int): Number of parts requested in the prompt.\n",
-    "\n",
-    "    Returns:\n",
-    "        list[str]: Part contents without the \"Phần N:\" label, or [] if the API call fails.\n",
-    "    \"\"\"\n",
-    "    import re  # local import keeps this cell independent of the import cell\n",
-    "\n",
-    "    # Show one example line per requested part, so the example agrees with the requested count.\n",
-    "    format_lines = \"\\n\".join(\n",
-    "        f\"    - Phần {part_number}: [Nội dung]\" for part_number in range(1, number_of_chunks + 1)\n",
-    "    )\n",
-    "    prompt = f\"\"\"\n",
-    "    Bạn là một chuyên gia xử lý văn bản. Hãy chia văn bản sau thành {number_of_chunks} đoạn có ý nghĩa sao cho mỗi đoạn vừa đủ để giải thích trong khoảng 3 đến 5 câu.\n",
-    "\n",
-    "    Văn bản:\n",
-    "    {text}\n",
-    "\n",
-    "    Định dạng đầu ra:\n",
-    "{format_lines}\n",
-    "    \"\"\"\n",
-    "\n",
-    "    try:\n",
-    "        model = genai.GenerativeModel(\"gemini-pro\")\n",
-    "        response = model.generate_content(prompt)\n",
-    "        result_text = response.text.strip()\n",
-    "\n",
-    "        # Split on \"Phần N:\" markers at the start of a line, tolerating a bullet and bold markup,\n",
-    "        # so the label itself does not end up inside the chunk.\n",
-    "        pieces = re.split(r\"(?m)^\\s*(?:[-*•]\\s*)?\\**Phần\\s+\\d+\\**\\s*[:.]\\**\\s*\", result_text)\n",
-    "        if len(pieces) > 1:\n",
-    "            pieces = pieces[1:]  # text before the first marker is preamble, not a part\n",
-    "        return [piece.strip() for piece in pieces if piece.strip()]\n",
-    "    except Exception as e:\n",
-    "        print(f\"Lỗi khi gọi API Gemini: {e}\")\n",
-    "        return []"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def generate_explaination_for_chunks(chunks, analysis_level='basic', style='academic', word_limit=100):\n",
-    "    \"\"\"\n",
-    "    Ask Gemini for an explanation of each chunk at the requested depth and style.\n",
-    "\n",
-    "    :param chunks: List of text chunks to analyse.\n",
-    "    :param analysis_level: Depth of analysis ('basic' or 'detailed').\n",
-    "    :param style: Writing style ('academic', 'popular', 'creative', 'humorous').\n",
-    "    :param word_limit: Word limit stated in the prompt for each explanation.\n",
-    "    :return: One explanation per chunk, in order; [] if any API call fails.\n",
-    "    :raises KeyError: If analysis_level or style is not one of the values above.\n",
-    "    \"\"\"\n",
-    "\n",
-    "    level_prompts = {\n",
-    "        'basic': \"Hãy đưa ra một bản tóm tắt ngắn gọn, tập trung vào nội dung chính.\",\n",
-    "        'detailed': \"Hãy phân tích chuyên sâu từng phần, làm rõ ý nghĩa, ngữ cảnh và các yếu tố quan trọng.\"\n",
-    "    }\n",
-    "\n",
-    "    style_prompts = {\n",
-    "        'academic': \"Phân tích theo phong cách học thuật, sử dụng ngôn ngữ chuyên sâu và lập luận chặt chẽ.\",\n",
-    "        'popular': \"Trình bày theo phong cách phổ thông, dễ hiểu và phù hợp với nhiều đối tượng.\",\n",
-    "        'creative': \"Giải thích một cách sáng tạo, sử dụng hình ảnh ẩn dụ và cách diễn đạt thú vị.\",\n",
-    "        'humorous': \"Phân tích theo phong cách hài hước, thêm vào yếu tố vui nhộn và bất ngờ.\"\n",
-    "    }\n",
-    "\n",
-    "    # Look the instructions up before the try block so an unsupported option raises KeyError\n",
-    "    # instead of being reported as an API failure.\n",
-    "    level_instruction = level_prompts[analysis_level]\n",
-    "    style_instruction = style_prompts[style]\n",
-    "\n",
-    "    try:\n",
-    "        model = genai.GenerativeModel(\"gemini-pro\")\n",
-    "\n",
-    "        # No separate overview request is sent: its reply was never used, so it only cost\n",
-    "        # an extra API call.\n",
-    "        explanations = []\n",
-    "        for idx, chunk in enumerate(chunks, start=1):\n",
-    "            part_prompt = f\"\"\"\n",
-    "            Phân tích phần {idx} của văn bản.\n",
-    "            {level_instruction}\n",
-    "            {style_instruction}\n",
-    "            Nội dung phần này:\n",
-    "            {chunk}\n",
-    "            Hãy đảm bảo phần tóm tắt không vượt quá {word_limit} từ.\n",
-    "            \"\"\"\n",
-    "\n",
-    "            part_response = model.generate_content(part_prompt)\n",
-    "            explanations.append(part_response.text.strip())\n",
-    "\n",
-    "        return explanations\n",
-    "\n",
-    "    except Exception as e:\n",
-    "        print(f\"Lỗi khi gọi API Gemini: {e}\")\n",
-    "        return []"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Split the text into semantic chunks with the Gemini API\n",
-    "semantic_chunks = split_text_by_semantics(text, number_of_chunks=3)\n",
-    "\n",
-    "# Produce an explanation for each semantic chunk\n",
-    "explainations = generate_explaination_for_chunks(semantic_chunks)\n",
-    "\n",
-    "# Show the results, numbering the parts from 1\n",
-    "for idx, explaination in enumerate(explainations, 1):\n",
-    "    message = f\"Giải thích cho Phần {idx}:\\n{explaination}\\n\"\n",
-    "    print(message)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import re\n",
-    "\n",
-    "# Save every sentence of every explanation to its own file\n",
-    "for idx, explaination in enumerate(explainations, start=1):\n",
-    "    # Split only on periods that end a sentence (followed by whitespace or the end of the text),\n",
-    "    # so decimals such as \"3.5\" are not cut in half.\n",
-    "    fragments = (fragment.strip() for fragment in re.split(r\"\\.(?=\\s|$)\", explaination))\n",
-    "    # Drop empty fragments before numbering so the file names have no gaps.\n",
-    "    sentences = [fragment for fragment in fragments if fragment]\n",
-    "\n",
-    "    for sentence_idx, sentence in enumerate(sentences, start=1):\n",
-    "        output_file = f\"../data/text/{idx}_{sentence_idx}.txt\"  # file name follows the x_y.txt pattern\n",
-    "        with open(output_file, \"w\", encoding=\"utf-8\") as f:\n",
-    "            f.write(f\"'{sentence}'\")  # the sentence is written wrapped in single quotes\n",
-    "        print(f\"Đã lưu: {output_file}\")"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "base",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.12.7"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}

notebook/text_to_speech.ipynb DELETED Viewed

@@ -1,224 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "code",
-   "execution_count": 6,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import torch\n",
-    "from transformers import VitsModel, AutoTokenizer\n",
-    "import torchaudio\n",
-    "import numpy as np\n",
-    "import os\n",
-    "from gtts import gTTS"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 11,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Đọc và load danh sách từ các file .txt trong thư mục ../data/text\n",
-    "import re\n",
-    "\n",
-    "# Collect the per-sentence files (named <part>_<sentence>.txt) from ../data/text\n",
-    "text_folder = \"../data/text\"\n",
-    "sentence_file_pattern = re.compile(r\"^(\\d+)_(\\d+)\\.txt$\")\n",
-    "\n",
-    "# Keep only <part>_<sentence>.txt names (other .txt files in the folder, such as a raw text.txt\n",
-    "# dump, are not sentences) and order them numerically so 1_2 comes before 1_10.\n",
-    "text_files = sorted(\n",
-    "    (name for name in os.listdir(text_folder) if sentence_file_pattern.match(name)),\n",
-    "    key=lambda name: tuple(int(number) for number in sentence_file_pattern.match(name).groups()),\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 9,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "✅ Audio saved as hello.mp3 (gTTS - Female)\n"
-     ]
-    }
-   ],
-   "source": [
-    "from functools import lru_cache\n",
-    "\n",
-    "\n",
-    "@lru_cache(maxsize=1)\n",
-    "def _load_mms_tts():\n",
-    "    \"\"\"Load the MMS-TTS Vietnamese model and tokenizer once and reuse them on later calls.\"\"\"\n",
-    "    model = VitsModel.from_pretrained(\"facebook/mms-tts-vie\")\n",
-    "    tokenizer = AutoTokenizer.from_pretrained(\"facebook/mms-tts-vie\")\n",
-    "    return model, tokenizer\n",
-    "\n",
-    "\n",
-    "def text_to_speech(text, filename=\"output.mp3\", gender=\"female\", speed=\"normal\"):\n",
-    "    \"\"\"\n",
-    "    Convert Vietnamese text to speech and save it as an audio file.\n",
-    "\n",
-    "    Parameters:\n",
-    "        text (str): The text to convert.\n",
-    "        filename (str): The output file name.\n",
-    "        gender (str): \"male\" (MMS-TTS) or \"female\" (gTTS); any other value only prints a warning.\n",
-    "        speed (str): \"slow\", \"normal\", or \"fast\" (gTTS only). Only \"slow\" changes the\n",
-    "            result; \"fast\" behaves like \"normal\".\n",
-    "    \"\"\"\n",
-    "    lang = \"vi\"\n",
-    "    voice = gender.lower()\n",
-    "\n",
-    "    if voice == \"female\":\n",
-    "        # gTTS only offers a female voice and a single slow/normal switch.\n",
-    "        # NOTE(review): gTTS appears to write MP3 data whatever the extension of `filename` -\n",
-    "        # confirm that callers passing a .wav name can handle that.\n",
-    "        slow = speed.lower() == \"slow\"\n",
-    "\n",
-    "        tts = gTTS(text=text, lang=lang, slow=slow)\n",
-    "        tts.save(filename)\n",
-    "        print(f\"✅ Audio saved as {filename}\")\n",
-    "\n",
-    "    elif voice == \"male\":\n",
-    "        # MMS-TTS provides the male voice; the cached loader avoids reloading it per sentence.\n",
-    "        model, tokenizer = _load_mms_tts()\n",
-    "\n",
-    "        inputs = tokenizer(text, return_tensors=\"pt\")\n",
-    "        with torch.no_grad():\n",
-    "            output = model(**inputs).waveform\n",
-    "\n",
-    "        # Save with the model's own sampling rate rather than a hard-coded 24000, which\n",
-    "        # distorts playback speed and pitch whenever the two differ.\n",
-    "        torchaudio.save(filename, output, model.config.sampling_rate)\n",
-    "        print(f\"✅ Audio saved as {filename}\")\n",
-    "\n",
-    "    else:\n",
-    "        print(\"⚠️ Giọng không hợp lệ! Chỉ hỗ trợ 'male' hoặc 'female'.\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 12,
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "✅ Audio saved as 1_1.wav (gTTS - Female)\n",
-      "Đã lưu 1_1.wav\n",
-      "✅ Audio saved as 1_10.wav (gTTS - Female)\n",
-      "Đã lưu 1_10.wav\n",
-      "✅ Audio saved as 1_11.wav (gTTS - Female)\n",
-      "Đã lưu 1_11.wav\n",
-      "✅ Audio saved as 1_12.wav (gTTS - Female)\n",
-      "Đã lưu 1_12.wav\n",
-      "✅ Audio saved as 1_13.wav (gTTS - Female)\n",
-      "Đã lưu 1_13.wav\n",
-      "✅ Audio saved as 1_14.wav (gTTS - Female)\n",
-      "Đã lưu 1_14.wav\n",
-      "✅ Audio saved as 1_15.wav (gTTS - Female)\n",
-      "Đã lưu 1_15.wav\n",
-      "✅ Audio saved as 1_16.wav (gTTS - Female)\n",
-      "Đã lưu 1_16.wav\n",
-      "✅ Audio saved as 1_17.wav (gTTS - Female)\n",
-      "Đã lưu 1_17.wav\n",
-      "✅ Audio saved as 1_2.wav (gTTS - Female)\n",
-      "Đã lưu 1_2.wav\n",
-      "✅ Audio saved as 1_3.wav (gTTS - Female)\n",
-      "Đã lưu 1_3.wav\n",
-      "✅ Audio saved as 1_4.wav (gTTS - Female)\n",
-      "Đã lưu 1_4.wav\n",
-      "✅ Audio saved as 1_5.wav (gTTS - Female)\n",
-      "Đã lưu 1_5.wav\n",
-      "✅ Audio saved as 1_6.wav (gTTS - Female)\n",
-      "Đã lưu 1_6.wav\n",
-      "✅ Audio saved as 1_7.wav (gTTS - Female)\n",
-      "Đã lưu 1_7.wav\n",
-      "✅ Audio saved as 1_8.wav (gTTS - Female)\n",
-      "Đã lưu 1_8.wav\n",
-      "✅ Audio saved as 1_9.wav (gTTS - Female)\n",
-      "Đã lưu 1_9.wav\n",
-      "✅ Audio saved as 2_1.wav (gTTS - Female)\n",
-      "Đã lưu 2_1.wav\n",
-      "✅ Audio saved as 2_10.wav (gTTS - Female)\n",
-      "Đã lưu 2_10.wav\n",
-      "✅ Audio saved as 2_11.wav (gTTS - Female)\n",
-      "Đã lưu 2_11.wav\n",
-      "✅ Audio saved as 2_12.wav (gTTS - Female)\n",
-      "Đã lưu 2_12.wav\n",
-      "✅ Audio saved as 2_13.wav (gTTS - Female)\n",
-      "Đã lưu 2_13.wav\n",
-      "✅ Audio saved as 2_14.wav (gTTS - Female)\n",
-      "Đã lưu 2_14.wav\n",
-      "✅ Audio saved as 2_15.wav (gTTS - Female)\n",
-      "Đã lưu 2_15.wav\n",
-      "✅ Audio saved as 2_16.wav (gTTS - Female)\n",
-      "Đã lưu 2_16.wav\n",
-      "✅ Audio saved as 2_17.wav (gTTS - Female)\n",
-      "Đã lưu 2_17.wav\n",
-      "✅ Audio saved as 2_18.wav (gTTS - Female)\n",
-      "Đã lưu 2_18.wav\n",
-      "✅ Audio saved as 2_2.wav (gTTS - Female)\n",
-      "Đã lưu 2_2.wav\n",
-      "✅ Audio saved as 2_3.wav (gTTS - Female)\n",
-      "Đã lưu 2_3.wav\n",
-      "✅ Audio saved as 2_4.wav (gTTS - Female)\n",
-      "Đã lưu 2_4.wav\n",
-      "✅ Audio saved as 2_5.wav (gTTS - Female)\n",
-      "Đã lưu 2_5.wav\n",
-      "✅ Audio saved as 2_6.wav (gTTS - Female)\n",
-      "Đã lưu 2_6.wav\n",
-      "✅ Audio saved as 2_7.wav (gTTS - Female)\n",
-      "Đã lưu 2_7.wav\n",
-      "✅ Audio saved as 2_8.wav (gTTS - Female)\n",
-      "Đã lưu 2_8.wav\n",
-      "✅ Audio saved as 2_9.wav (gTTS - Female)\n",
-      "Đã lưu 2_9.wav\n",
-      "✅ Audio saved as 3_1.wav (gTTS - Female)\n",
-      "Đã lưu 3_1.wav\n",
-      "✅ Audio saved as 3_10.wav (gTTS - Female)\n",
-      "Đã lưu 3_10.wav\n",
-      "✅ Audio saved as 3_11.wav (gTTS - Female)\n",
-      "Đã lưu 3_11.wav\n",
-      "✅ Audio saved as 3_12.wav (gTTS - Female)\n",
-      "Đã lưu 3_12.wav\n",
-      "✅ Audio saved as 3_14.wav (gTTS - Female)\n",
-      "Đã lưu 3_14.wav\n",
-      "✅ Audio saved as 3_17.wav (gTTS - Female)\n",
-      "Đã lưu 3_17.wav\n",
-      "✅ Audio saved as 3_18.wav (gTTS - Female)\n",
-      "Đã lưu 3_18.wav\n",
-      "✅ Audio saved as 3_19.wav (gTTS - Female)\n",
-      "Đã lưu 3_19.wav\n",
-      "✅ Audio saved as 3_2.wav (gTTS - Female)\n",
-      "Đã lưu 3_2.wav\n",
-      "✅ Audio saved as 3_3.wav (gTTS - Female)\n",
-      "Đã lưu 3_3.wav\n",
-      "✅ Audio saved as 3_4.wav (gTTS - Female)\n",
-      "Đã lưu 3_4.wav\n",
-      "✅ Audio saved as 3_5.wav (gTTS - Female)\n",
-      "Đã lưu 3_5.wav\n",
-      "✅ Audio saved as 3_6.wav (gTTS - Female)\n",
-      "Đã lưu 3_6.wav\n",
-      "✅ Audio saved as 3_7.wav (gTTS - Female)\n",
-      "Đã lưu 3_7.wav\n",
-      "✅ Audio saved as 3_8.wav (gTTS - Female)\n",
-      "Đã lưu 3_8.wav\n",
-      "✅ Audio saved as 3_9.wav (gTTS - Female)\n",
-      "Đã lưu 3_9.wav\n"
-     ]
-    }
-   ],
-   "source": [
-    "for text_file in text_files:\n",
-    "    # Read from the same folder the file names were listed from.\n",
-    "    with open(os.path.join(text_folder, text_file), \"r\", encoding=\"utf-8\") as file:\n",
-    "        content = file.read()\n",
-    "    # Swap only the extension; str.replace(\"txt\", \"wav\") would also rewrite \"txt\" inside the stem.\n",
-    "    audio_file = os.path.splitext(text_file)[0] + \".wav\"\n",
-    "    text_to_speech(content, audio_file)"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "base",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.12.7"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}

notebook/text_to_video.ipynb DELETED Viewed

The diff for this file is too large to render. See raw diff