neelimapreeti297 committed on
Commit
f394198
·
verified ·
1 Parent(s): 96da389

Upload germanToEnglish.ipynb

Browse files
Files changed (1) hide show
  1. germanToEnglish.ipynb +1205 -0
germanToEnglish.ipynb ADDED
@@ -0,0 +1,1205 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": null,
6
+ "metadata": {
7
+ "id": "wsIPzMNfW3QH"
8
+ },
9
+ "outputs": [],
10
+ "source": [
11
+ "from torchtext.data.utils import get_tokenizer\n",
12
+ "from torchtext.vocab import build_vocab_from_iterator\n",
13
+ "from torchtext.datasets import multi30k, Multi30k\n",
14
+ "from typing import Iterable, List\n",
15
+ "\n",
16
+ "\n",
17
+ "# We need to modify the URLs for the dataset since the links to the original dataset are broken\n",
18
+ "# Refer to https://github.com/pytorch/text/issues/1756#issuecomment-1163664163 for more info\n",
19
+ "multi30k.URL[\"train\"] = \"https://raw.githubusercontent.com/neychev/small_DL_repo/master/datasets/Multi30k/training.tar.gz\"\n",
20
+ "multi30k.URL[\"valid\"] = \"https://raw.githubusercontent.com/neychev/small_DL_repo/master/datasets/Multi30k/validation.tar.gz\"\n",
21
+ "\n",
22
+ "SRC_LANGUAGE = 'de'\n",
23
+ "TGT_LANGUAGE = 'en'\n",
24
+ "\n",
25
+ "# Place-holders\n",
26
+ "token_transform = {}\n",
27
+ "vocab_transform = {}"
28
+ ]
29
+ },
30
+ {
31
+ "cell_type": "code",
32
+ "execution_count": null,
33
+ "metadata": {
34
+ "colab": {
35
+ "base_uri": "https://localhost:8080/"
36
+ },
37
+ "id": "T8LEEOd2r-PV",
38
+ "outputId": "33e10bf6-dd1f-4760-ae2a-5fffd2996edb"
39
+ },
40
+ "outputs": [
41
+ {
42
+ "name": "stdout",
43
+ "output_type": "stream",
44
+ "text": [
45
+ "Drive already mounted at /gdrive; to attempt to forcibly remount, call drive.mount(\"/gdrive\", force_remount=True).\n"
46
+ ]
47
+ }
48
+ ],
49
+ "source": [
50
+ "from google.colab import drive\n",
51
+ "drive.mount('/gdrive')"
52
+ ]
53
+ },
54
+ {
55
+ "cell_type": "code",
56
+ "execution_count": null,
57
+ "metadata": {
58
+ "colab": {
59
+ "base_uri": "https://localhost:8080/"
60
+ },
61
+ "id": "mRx_hiQnLGjV",
62
+ "outputId": "90fe1bbb-76b7-489b-e864-1b41ffbbeeef"
63
+ },
64
+ "outputs": [
65
+ {
66
+ "name": "stdout",
67
+ "output_type": "stream",
68
+ "text": [
69
+ "Requirement already satisfied: torchdata in /usr/local/lib/python3.10/dist-packages (0.7.1)\n",
70
+ "Requirement already satisfied: urllib3>=1.25 in /usr/local/lib/python3.10/dist-packages (from torchdata) (2.0.7)\n",
71
+ "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from torchdata) (2.31.0)\n",
72
+ "Requirement already satisfied: torch>=2 in /usr/local/lib/python3.10/dist-packages (from torchdata) (2.2.1+cu121)\n",
73
+ "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (3.13.3)\n",
74
+ "Requirement already satisfied: typing-extensions>=4.8.0 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (4.10.0)\n",
75
+ "Requirement already satisfied: sympy in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (1.12)\n",
76
+ "Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (3.2.1)\n",
77
+ "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (3.1.3)\n",
78
+ "Requirement already satisfied: fsspec in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (2023.6.0)\n",
79
+ "Requirement already satisfied: nvidia-cuda-nvrtc-cu12==12.1.105 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (12.1.105)\n",
80
+ "Requirement already satisfied: nvidia-cuda-runtime-cu12==12.1.105 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (12.1.105)\n",
81
+ "Requirement already satisfied: nvidia-cuda-cupti-cu12==12.1.105 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (12.1.105)\n",
82
+ "Requirement already satisfied: nvidia-cudnn-cu12==8.9.2.26 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (8.9.2.26)\n",
83
+ "Requirement already satisfied: nvidia-cublas-cu12==12.1.3.1 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (12.1.3.1)\n",
84
+ "Requirement already satisfied: nvidia-cufft-cu12==11.0.2.54 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (11.0.2.54)\n",
85
+ "Requirement already satisfied: nvidia-curand-cu12==10.3.2.106 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (10.3.2.106)\n",
86
+ "Requirement already satisfied: nvidia-cusolver-cu12==11.4.5.107 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (11.4.5.107)\n",
87
+ "Requirement already satisfied: nvidia-cusparse-cu12==12.1.0.106 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (12.1.0.106)\n",
88
+ "Requirement already satisfied: nvidia-nccl-cu12==2.19.3 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (2.19.3)\n",
89
+ "Requirement already satisfied: nvidia-nvtx-cu12==12.1.105 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (12.1.105)\n",
90
+ "Requirement already satisfied: triton==2.2.0 in /usr/local/lib/python3.10/dist-packages (from torch>=2->torchdata) (2.2.0)\n",
91
+ "Requirement already satisfied: nvidia-nvjitlink-cu12 in /usr/local/lib/python3.10/dist-packages (from nvidia-cusolver-cu12==11.4.5.107->torch>=2->torchdata) (12.4.127)\n",
92
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->torchdata) (3.3.2)\n",
93
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->torchdata) (3.6)\n",
94
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->torchdata) (2024.2.2)\n",
95
+ "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->torch>=2->torchdata) (2.1.5)\n",
96
+ "Requirement already satisfied: mpmath>=0.19 in /usr/local/lib/python3.10/dist-packages (from sympy->torch>=2->torchdata) (1.3.0)\n",
97
+ "Requirement already satisfied: spacy in /usr/local/lib/python3.10/dist-packages (3.7.4)\n",
98
+ "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.11 in /usr/local/lib/python3.10/dist-packages (from spacy) (3.0.12)\n",
99
+ "Requirement already satisfied: spacy-loggers<2.0.0,>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (1.0.5)\n",
100
+ "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (1.0.10)\n",
101
+ "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /usr/local/lib/python3.10/dist-packages (from spacy) (2.0.8)\n",
102
+ "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /usr/local/lib/python3.10/dist-packages (from spacy) (3.0.9)\n",
103
+ "Requirement already satisfied: thinc<8.3.0,>=8.2.2 in /usr/local/lib/python3.10/dist-packages (from spacy) (8.2.3)\n",
104
+ "Requirement already satisfied: wasabi<1.2.0,>=0.9.1 in /usr/local/lib/python3.10/dist-packages (from spacy) (1.1.2)\n",
105
+ "Requirement already satisfied: srsly<3.0.0,>=2.4.3 in /usr/local/lib/python3.10/dist-packages (from spacy) (2.4.8)\n",
106
+ "Requirement already satisfied: catalogue<2.1.0,>=2.0.6 in /usr/local/lib/python3.10/dist-packages (from spacy) (2.0.10)\n",
107
+ "Requirement already satisfied: weasel<0.4.0,>=0.1.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (0.3.4)\n",
108
+ "Requirement already satisfied: typer<0.10.0,>=0.3.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (0.9.4)\n",
109
+ "Requirement already satisfied: smart-open<7.0.0,>=5.2.1 in /usr/local/lib/python3.10/dist-packages (from spacy) (6.4.0)\n",
110
+ "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (4.66.2)\n",
111
+ "Requirement already satisfied: requests<3.0.0,>=2.13.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (2.31.0)\n",
112
+ "Requirement already satisfied: pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4 in /usr/local/lib/python3.10/dist-packages (from spacy) (2.6.4)\n",
113
+ "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from spacy) (3.1.3)\n",
114
+ "Requirement already satisfied: setuptools in /usr/local/lib/python3.10/dist-packages (from spacy) (67.7.2)\n",
115
+ "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (24.0)\n",
116
+ "Requirement already satisfied: langcodes<4.0.0,>=3.2.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (3.3.0)\n",
117
+ "Requirement already satisfied: numpy>=1.19.0 in /usr/local/lib/python3.10/dist-packages (from spacy) (1.25.2)\n",
118
+ "Requirement already satisfied: annotated-types>=0.4.0 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy) (0.6.0)\n",
119
+ "Requirement already satisfied: pydantic-core==2.16.3 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy) (2.16.3)\n",
120
+ "Requirement already satisfied: typing-extensions>=4.6.1 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy) (4.10.0)\n",
121
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy) (3.3.2)\n",
122
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy) (3.6)\n",
123
+ "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy) (2.0.7)\n",
124
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy) (2024.2.2)\n",
125
+ "Requirement already satisfied: blis<0.8.0,>=0.7.8 in /usr/local/lib/python3.10/dist-packages (from thinc<8.3.0,>=8.2.2->spacy) (0.7.11)\n",
126
+ "Requirement already satisfied: confection<1.0.0,>=0.0.1 in /usr/local/lib/python3.10/dist-packages (from thinc<8.3.0,>=8.2.2->spacy) (0.1.4)\n",
127
+ "Requirement already satisfied: click<9.0.0,>=7.1.1 in /usr/local/lib/python3.10/dist-packages (from typer<0.10.0,>=0.3.0->spacy) (8.1.7)\n",
128
+ "Requirement already satisfied: cloudpathlib<0.17.0,>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from weasel<0.4.0,>=0.1.0->spacy) (0.16.0)\n",
129
+ "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->spacy) (2.1.5)\n"
130
+ ]
131
+ }
132
+ ],
133
+ "source": [
134
+ "!pip install -U torchdata\n",
135
+ "!pip install -U spacy"
136
+ ]
137
+ },
138
+ {
139
+ "cell_type": "code",
140
+ "execution_count": null,
141
+ "metadata": {
142
+ "colab": {
143
+ "base_uri": "https://localhost:8080/"
144
+ },
145
+ "id": "WdqsXpFuzGrH",
146
+ "outputId": "f5402068-ed10-445e-82a6-9db4d11d310c"
147
+ },
148
+ "outputs": [
149
+ {
150
+ "name": "stdout",
151
+ "output_type": "stream",
152
+ "text": [
153
+ "Collecting en-core-web-sm==3.7.1\n",
154
+ " Using cached https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.7.1/en_core_web_sm-3.7.1-py3-none-any.whl (12.8 MB)\n",
155
+ "Requirement already satisfied: spacy<3.8.0,>=3.7.2 in /usr/local/lib/python3.10/dist-packages (from en-core-web-sm==3.7.1) (3.7.4)\n",
156
+ "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.11 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.0.12)\n",
157
+ "Requirement already satisfied: spacy-loggers<2.0.0,>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.0.5)\n",
158
+ "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.0.10)\n",
159
+ "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.0.8)\n",
160
+ "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.0.9)\n",
161
+ "Requirement already satisfied: thinc<8.3.0,>=8.2.2 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (8.2.3)\n",
162
+ "Requirement already satisfied: wasabi<1.2.0,>=0.9.1 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.1.2)\n",
163
+ "Requirement already satisfied: srsly<3.0.0,>=2.4.3 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.4.8)\n",
164
+ "Requirement already satisfied: catalogue<2.1.0,>=2.0.6 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.0.10)\n",
165
+ "Requirement already satisfied: weasel<0.4.0,>=0.1.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.3.4)\n",
166
+ "Requirement already satisfied: typer<0.10.0,>=0.3.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.9.4)\n",
167
+ "Requirement already satisfied: smart-open<7.0.0,>=5.2.1 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (6.4.0)\n",
168
+ "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (4.66.2)\n",
169
+ "Requirement already satisfied: requests<3.0.0,>=2.13.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.31.0)\n",
170
+ "Requirement already satisfied: pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.6.4)\n",
171
+ "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.1.3)\n",
172
+ "Requirement already satisfied: setuptools in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (67.7.2)\n",
173
+ "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (24.0)\n",
174
+ "Requirement already satisfied: langcodes<4.0.0,>=3.2.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.3.0)\n",
175
+ "Requirement already satisfied: numpy>=1.19.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (1.25.2)\n",
176
+ "Requirement already satisfied: annotated-types>=0.4.0 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.6.0)\n",
177
+ "Requirement already satisfied: pydantic-core==2.16.3 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.16.3)\n",
178
+ "Requirement already satisfied: typing-extensions>=4.6.1 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (4.10.0)\n",
179
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.3.2)\n",
180
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (3.6)\n",
181
+ "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.0.7)\n",
182
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2024.2.2)\n",
183
+ "Requirement already satisfied: blis<0.8.0,>=0.7.8 in /usr/local/lib/python3.10/dist-packages (from thinc<8.3.0,>=8.2.2->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.7.11)\n",
184
+ "Requirement already satisfied: confection<1.0.0,>=0.0.1 in /usr/local/lib/python3.10/dist-packages (from thinc<8.3.0,>=8.2.2->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.1.4)\n",
185
+ "Requirement already satisfied: click<9.0.0,>=7.1.1 in /usr/local/lib/python3.10/dist-packages (from typer<0.10.0,>=0.3.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (8.1.7)\n",
186
+ "Requirement already satisfied: cloudpathlib<0.17.0,>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from weasel<0.4.0,>=0.1.0->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (0.16.0)\n",
187
+ "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->spacy<3.8.0,>=3.7.2->en-core-web-sm==3.7.1) (2.1.5)\n",
188
+ "\u001b[38;5;2m✔ Download and installation successful\u001b[0m\n",
189
+ "You can now load the package via spacy.load('en_core_web_sm')\n",
190
+ "\u001b[38;5;3m⚠ Restart to reload dependencies\u001b[0m\n",
191
+ "If you are in a Jupyter or Colab notebook, you may need to restart Python in\n",
192
+ "order to load all the package's dependencies. You can do this by selecting the\n",
193
+ "'Restart kernel' or 'Restart runtime' option.\n",
194
+ "Collecting de-core-news-sm==3.7.0\n",
195
+ " Using cached https://github.com/explosion/spacy-models/releases/download/de_core_news_sm-3.7.0/de_core_news_sm-3.7.0-py3-none-any.whl (14.6 MB)\n",
196
+ "Requirement already satisfied: spacy<3.8.0,>=3.7.0 in /usr/local/lib/python3.10/dist-packages (from de-core-news-sm==3.7.0) (3.7.4)\n",
197
+ "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.11 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (3.0.12)\n",
198
+ "Requirement already satisfied: spacy-loggers<2.0.0,>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (1.0.5)\n",
199
+ "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (1.0.10)\n",
200
+ "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2.0.8)\n",
201
+ "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (3.0.9)\n",
202
+ "Requirement already satisfied: thinc<8.3.0,>=8.2.2 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (8.2.3)\n",
203
+ "Requirement already satisfied: wasabi<1.2.0,>=0.9.1 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (1.1.2)\n",
204
+ "Requirement already satisfied: srsly<3.0.0,>=2.4.3 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2.4.8)\n",
205
+ "Requirement already satisfied: catalogue<2.1.0,>=2.0.6 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2.0.10)\n",
206
+ "Requirement already satisfied: weasel<0.4.0,>=0.1.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (0.3.4)\n",
207
+ "Requirement already satisfied: typer<0.10.0,>=0.3.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (0.9.4)\n",
208
+ "Requirement already satisfied: smart-open<7.0.0,>=5.2.1 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (6.4.0)\n",
209
+ "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (4.66.2)\n",
210
+ "Requirement already satisfied: requests<3.0.0,>=2.13.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2.31.0)\n",
211
+ "Requirement already satisfied: pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2.6.4)\n",
212
+ "Requirement already satisfied: jinja2 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (3.1.3)\n",
213
+ "Requirement already satisfied: setuptools in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (67.7.2)\n",
214
+ "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (24.0)\n",
215
+ "Requirement already satisfied: langcodes<4.0.0,>=3.2.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (3.3.0)\n",
216
+ "Requirement already satisfied: numpy>=1.19.0 in /usr/local/lib/python3.10/dist-packages (from spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (1.25.2)\n",
217
+ "Requirement already satisfied: annotated-types>=0.4.0 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (0.6.0)\n",
218
+ "Requirement already satisfied: pydantic-core==2.16.3 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2.16.3)\n",
219
+ "Requirement already satisfied: typing-extensions>=4.6.1 in /usr/local/lib/python3.10/dist-packages (from pydantic!=1.8,!=1.8.1,<3.0.0,>=1.7.4->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (4.10.0)\n",
220
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (3.3.2)\n",
221
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (3.6)\n",
222
+ "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2.0.7)\n",
223
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests<3.0.0,>=2.13.0->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2024.2.2)\n",
224
+ "Requirement already satisfied: blis<0.8.0,>=0.7.8 in /usr/local/lib/python3.10/dist-packages (from thinc<8.3.0,>=8.2.2->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (0.7.11)\n",
225
+ "Requirement already satisfied: confection<1.0.0,>=0.0.1 in /usr/local/lib/python3.10/dist-packages (from thinc<8.3.0,>=8.2.2->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (0.1.4)\n",
226
+ "Requirement already satisfied: click<9.0.0,>=7.1.1 in /usr/local/lib/python3.10/dist-packages (from typer<0.10.0,>=0.3.0->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (8.1.7)\n",
227
+ "Requirement already satisfied: cloudpathlib<0.17.0,>=0.7.0 in /usr/local/lib/python3.10/dist-packages (from weasel<0.4.0,>=0.1.0->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (0.16.0)\n",
228
+ "Requirement already satisfied: MarkupSafe>=2.0 in /usr/local/lib/python3.10/dist-packages (from jinja2->spacy<3.8.0,>=3.7.0->de-core-news-sm==3.7.0) (2.1.5)\n",
229
+ "\u001b[38;5;2m✔ Download and installation successful\u001b[0m\n",
230
+ "You can now load the package via spacy.load('de_core_news_sm')\n",
231
+ "\u001b[38;5;3m⚠ Restart to reload dependencies\u001b[0m\n",
232
+ "If you are in a Jupyter or Colab notebook, you may need to restart Python in\n",
233
+ "order to load all the package's dependencies. You can do this by selecting the\n",
234
+ "'Restart kernel' or 'Restart runtime' option.\n"
235
+ ]
236
+ }
237
+ ],
238
+ "source": [
239
+ "!python -m spacy download en_core_web_sm\n",
240
+ "!python -m spacy download de_core_news_sm"
241
+ ]
242
+ },
243
+ {
244
+ "cell_type": "code",
245
+ "execution_count": null,
246
+ "metadata": {
247
+ "id": "Vmir-6Ppki3_"
248
+ },
249
+ "outputs": [],
250
+ "source": [
251
+ "!pip install 'portalocker>=2.0.0'"
252
+ ]
253
+ },
254
+ {
255
+ "cell_type": "code",
256
+ "execution_count": 92,
257
+ "metadata": {
258
+ "colab": {
259
+ "base_uri": "https://localhost:8080/"
260
+ },
261
+ "id": "nzh92t5UW9bu",
262
+ "outputId": "4db35419-1b6d-413f-89b8-791214a07826"
263
+ },
264
+ "outputs": [
265
+ {
266
+ "output_type": "stream",
267
+ "name": "stderr",
268
+ "text": [
269
+ "/usr/local/lib/python3.10/dist-packages/spacy/util.py:1740: UserWarning: [W111] Jupyter notebook detected: if using `prefer_gpu()` or `require_gpu()`, include it in the same cell right before `spacy.load()` to ensure that the model is loaded on the correct device. More information: http://spacy.io/usage/v3#jupyter-notebook-gpu\n",
270
+ " warnings.warn(Warnings.W111)\n"
271
+ ]
272
+ }
273
+ ],
274
+ "source": [
275
+ "token_transform[SRC_LANGUAGE] = get_tokenizer('spacy', language='de_core_news_sm')\n",
276
+ "token_transform[TGT_LANGUAGE] = get_tokenizer('spacy', language='en_core_web_sm')\n",
277
+ "\n",
278
+ "\n",
279
+ "# helper function to yield list of tokens\n",
280
+ "def yield_tokens(data_iter: Iterable, language: str) -> List[str]:\n",
281
+ " language_index = {SRC_LANGUAGE: 0, TGT_LANGUAGE: 1}\n",
282
+ "\n",
283
+ " for data_sample in data_iter:\n",
284
+ " yield token_transform[language](data_sample[language_index[language]])\n",
285
+ "\n",
286
+ "# Define special symbols and indices\n",
287
+ "UNK_IDX, PAD_IDX, BOS_IDX, EOS_IDX = 0, 1, 2, 3\n",
288
+ "# Make sure the tokens are in order of their indices to properly insert them in vocab\n",
289
+ "special_symbols = ['<unk>', '<pad>', '<bos>', '<eos>']\n",
290
+ "\n",
291
+ "for ln in [SRC_LANGUAGE, TGT_LANGUAGE]:\n",
292
+ " # Training data Iterator\n",
293
+ " train_iter = Multi30k(split='train', language_pair=(SRC_LANGUAGE, TGT_LANGUAGE))\n",
294
+ " # Create torchtext's Vocab object\n",
295
+ " vocab_transform[ln] = build_vocab_from_iterator(yield_tokens(train_iter, ln),\n",
296
+ " min_freq=1,\n",
297
+ " specials=special_symbols,\n",
298
+ " special_first=True)\n",
299
+ "\n",
300
+ "# Set ``UNK_IDX`` as the default index. This index is returned when the token is not found.\n",
301
+ "# If not set, it throws ``RuntimeError`` when the queried token is not found in the Vocabulary.\n",
302
+ "for ln in [SRC_LANGUAGE, TGT_LANGUAGE]:\n",
303
+ " vocab_transform[ln].set_default_index(UNK_IDX)"
304
+ ]
305
+ },
306
+ {
307
+ "cell_type": "code",
308
+ "execution_count": 93,
309
+ "metadata": {
310
+ "id": "OB_yiHCaXKv8"
311
+ },
312
+ "outputs": [],
313
+ "source": [
314
+ "from torch import Tensor\n",
315
+ "import torch\n",
316
+ "import torch.nn as nn\n",
317
+ "from torch.nn import Transformer\n",
318
+ "import math\n",
319
+ "DEVICE = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n",
320
+ "\n",
321
+ "# helper Module that adds positional encoding to the token embedding to introduce a notion of word order.\n",
322
+ "class PositionalEncoding(nn.Module):\n",
323
+ " def __init__(self,\n",
324
+ " emb_size: int,\n",
325
+ " dropout: float,\n",
326
+ " maxlen: int = 5000):\n",
327
+ " super(PositionalEncoding, self).__init__()\n",
328
+ " den = torch.exp(- torch.arange(0, emb_size, 2)* math.log(10000) / emb_size)\n",
329
+ " pos = torch.arange(0, maxlen).reshape(maxlen, 1)\n",
330
+ " pos_embedding = torch.zeros((maxlen, emb_size))\n",
331
+ " pos_embedding[:, 0::2] = torch.sin(pos * den)\n",
332
+ " pos_embedding[:, 1::2] = torch.cos(pos * den)\n",
333
+ " pos_embedding = pos_embedding.unsqueeze(-2)\n",
334
+ "\n",
335
+ " self.dropout = nn.Dropout(dropout)\n",
336
+ " self.register_buffer('pos_embedding', pos_embedding)\n",
337
+ "\n",
338
+ " def forward(self, token_embedding: Tensor):\n",
339
+ " return self.dropout(token_embedding + self.pos_embedding[:token_embedding.size(0), :])\n",
340
+ "\n",
341
+ "# helper Module to convert tensor of input indices into corresponding tensor of token embeddings\n",
342
+ "class TokenEmbedding(nn.Module):\n",
343
+ " def __init__(self, vocab_size: int, emb_size):\n",
344
+ " super(TokenEmbedding, self).__init__()\n",
345
+ " self.embedding = nn.Embedding(vocab_size, emb_size)\n",
346
+ " self.emb_size = emb_size\n",
347
+ "\n",
348
+ " def forward(self, tokens: Tensor):\n",
349
+ " return self.embedding(tokens.long()) * math.sqrt(self.emb_size)\n",
350
+ "\n",
351
+ "# Seq2Seq Network\n",
352
+ "class Seq2SeqTransformer(nn.Module):\n",
353
+ " def __init__(self,\n",
354
+ " num_encoder_layers: int,\n",
355
+ " num_decoder_layers: int,\n",
356
+ " emb_size: int,\n",
357
+ " nhead: int,\n",
358
+ " src_vocab_size: int,\n",
359
+ " tgt_vocab_size: int,\n",
360
+ " dim_feedforward: int = 512,\n",
361
+ " dropout: float = 0.1):\n",
362
+ " super(Seq2SeqTransformer, self).__init__()\n",
363
+ " self.transformer = Transformer(d_model=emb_size,\n",
364
+ " nhead=nhead,\n",
365
+ " num_encoder_layers=num_encoder_layers,\n",
366
+ " num_decoder_layers=num_decoder_layers,\n",
367
+ " dim_feedforward=dim_feedforward,\n",
368
+ " dropout=dropout)\n",
369
+ " self.generator = nn.Linear(emb_size, tgt_vocab_size)\n",
370
+ " self.src_tok_emb = TokenEmbedding(src_vocab_size, emb_size)\n",
371
+ " self.tgt_tok_emb = TokenEmbedding(tgt_vocab_size, emb_size)\n",
372
+ " self.positional_encoding = PositionalEncoding(\n",
373
+ " emb_size, dropout=dropout)\n",
374
+ "\n",
375
+ " def forward(self,\n",
376
+ " src: Tensor,\n",
377
+ " trg: Tensor,\n",
378
+ " src_mask: Tensor,\n",
379
+ " tgt_mask: Tensor,\n",
380
+ " src_padding_mask: Tensor,\n",
381
+ " tgt_padding_mask: Tensor,\n",
382
+ " memory_key_padding_mask: Tensor):\n",
383
+ " src_emb = self.positional_encoding(self.src_tok_emb(src))\n",
384
+ " tgt_emb = self.positional_encoding(self.tgt_tok_emb(trg))\n",
385
+ " outs = self.transformer(src_emb, tgt_emb, src_mask, tgt_mask, None,\n",
386
+ " src_padding_mask, tgt_padding_mask, memory_key_padding_mask)\n",
387
+ " return self.generator(outs)\n",
388
+ "\n",
389
+ " def encode(self, src: Tensor, src_mask: Tensor):\n",
390
+ " return self.transformer.encoder(self.positional_encoding(\n",
391
+ " self.src_tok_emb(src)), src_mask)\n",
392
+ "\n",
393
+ " def decode(self, tgt: Tensor, memory: Tensor, tgt_mask: Tensor):\n",
394
+ " return self.transformer.decoder(self.positional_encoding(\n",
395
+ " self.tgt_tok_emb(tgt)), memory,\n",
396
+ " tgt_mask)"
397
+ ]
398
+ },
399
+ {
400
+ "cell_type": "code",
401
+ "execution_count": 94,
402
+ "metadata": {
403
+ "id": "ECpJWZp2r_xa"
404
+ },
405
+ "outputs": [],
406
+ "source": [
407
+ "from torch import Tensor\n",
408
+ "import torch\n",
409
+ "import torch.nn as nn\n",
410
+ "from torch.nn import Transformer\n",
411
+ "import math\n",
412
+ "DEVICE = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n",
413
+ "\n",
414
+ "# helper Module that adds positional encoding to the token embedding to introduce a notion of word order.\n",
415
+ "class PositionalEncoding(nn.Module):\n",
416
+ " def __init__(self,\n",
417
+ " emb_size: int,\n",
418
+ " dropout: float,\n",
419
+ " maxlen: int = 5000):\n",
420
+ " super(PositionalEncoding, self).__init__()\n",
421
+ " den = torch.exp(- torch.arange(0, emb_size, 2)* math.log(10000) / emb_size)\n",
422
+ " pos = torch.arange(0, maxlen).reshape(maxlen, 1)\n",
423
+ " pos_embedding = torch.zeros((maxlen, emb_size))\n",
424
+ " pos_embedding[:, 0::2] = torch.sin(pos * den)\n",
425
+ " pos_embedding[:, 1::2] = torch.cos(pos * den)\n",
426
+ " pos_embedding = pos_embedding.unsqueeze(-2)\n",
427
+ "\n",
428
+ " self.dropout = nn.Dropout(dropout)\n",
429
+ " self.register_buffer('pos_embedding', pos_embedding)\n",
430
+ "\n",
431
+ " def forward(self, token_embedding: Tensor):\n",
432
+ " return self.dropout(token_embedding + self.pos_embedding[:token_embedding.size(0), :])\n",
433
+ "\n",
434
+ "# helper Module to convert tensor of input indices into corresponding tensor of token embeddings\n",
435
+ "class TokenEmbedding(nn.Module):\n",
436
+ " def __init__(self, vocab_size: int, emb_size):\n",
437
+ " super(TokenEmbedding, self).__init__()\n",
438
+ " self.embedding = nn.Embedding(vocab_size, emb_size)\n",
439
+ " self.emb_size = emb_size\n",
440
+ "\n",
441
+ " def forward(self, tokens: Tensor):\n",
442
+ " return self.embedding(tokens.long()) * math.sqrt(self.emb_size)\n",
443
+ "\n",
444
+ "# Seq2Seq Network\n",
445
+ "class Seq2SeqTransformer(nn.Module):\n",
446
+ " def __init__(self,\n",
447
+ " num_encoder_layers: int,\n",
448
+ " num_decoder_layers: int,\n",
449
+ " emb_size: int,\n",
450
+ " nhead: int,\n",
451
+ " src_vocab_size: int,\n",
452
+ " tgt_vocab_size: int,\n",
453
+ " dim_feedforward: int = 512,\n",
454
+ " dropout: float = 0.1):\n",
455
+ " super(Seq2SeqTransformer, self).__init__()\n",
456
+ " self.transformer = Transformer(d_model=emb_size,\n",
457
+ " nhead=nhead,\n",
458
+ " num_encoder_layers=num_encoder_layers,\n",
459
+ " num_decoder_layers=num_decoder_layers,\n",
460
+ " dim_feedforward=dim_feedforward,\n",
461
+ " dropout=dropout)\n",
462
+ " self.generator = nn.Linear(emb_size, tgt_vocab_size)\n",
463
+ " self.src_tok_emb = TokenEmbedding(src_vocab_size, emb_size)\n",
464
+ " self.tgt_tok_emb = TokenEmbedding(tgt_vocab_size, emb_size)\n",
465
+ " self.positional_encoding = PositionalEncoding(\n",
466
+ " emb_size, dropout=dropout)\n",
467
+ "\n",
468
+ " def forward(self,\n",
469
+ " src: Tensor,\n",
470
+ " trg: Tensor,\n",
471
+ " src_mask: Tensor,\n",
472
+ " tgt_mask: Tensor,\n",
473
+ " src_padding_mask: Tensor,\n",
474
+ " tgt_padding_mask: Tensor,\n",
475
+ " memory_key_padding_mask: Tensor):\n",
476
+ " src_emb = self.positional_encoding(self.src_tok_emb(src))\n",
477
+ " tgt_emb = self.positional_encoding(self.tgt_tok_emb(trg))\n",
478
+ " outs = self.transformer(src_emb, tgt_emb, src_mask, tgt_mask, None,\n",
479
+ " src_padding_mask, tgt_padding_mask, memory_key_padding_mask)\n",
480
+ " return self.generator(outs)\n",
481
+ "\n",
482
+ " def encode(self, src: Tensor, src_mask: Tensor):\n",
483
+ " return self.transformer.encoder(self.positional_encoding(\n",
484
+ " self.src_tok_emb(src)), src_mask)\n",
485
+ "\n",
486
+ " def decode(self, tgt: Tensor, memory: Tensor, tgt_mask: Tensor):\n",
487
+ " return self.transformer.decoder(self.positional_encoding(\n",
488
+ " self.tgt_tok_emb(tgt)), memory,\n",
489
+ " tgt_mask)"
490
+ ]
491
+ },
492
+ {
493
+ "cell_type": "code",
494
+ "execution_count": 95,
495
+ "metadata": {
496
+ "id": "PUIS0MWUZCKc"
497
+ },
498
+ "outputs": [],
499
+ "source": [
500
+ "def generate_square_subsequent_mask(sz):\n",
501
+ " mask = (torch.triu(torch.ones((sz, sz), device=DEVICE)) == 1).transpose(0, 1)\n",
502
+ " mask = mask.float().masked_fill(mask == 0, float('-inf')).masked_fill(mask == 1, float(0.0))\n",
503
+ " return mask\n",
504
+ "\n",
505
+ "\n",
506
+ "def create_mask(src, tgt):\n",
507
+ " src_seq_len = src.shape[0]\n",
508
+ " tgt_seq_len = tgt.shape[0]\n",
509
+ "\n",
510
+ " tgt_mask = generate_square_subsequent_mask(tgt_seq_len)\n",
511
+ " src_mask = torch.zeros((src_seq_len, src_seq_len),device=DEVICE).type(torch.bool)\n",
512
+ "\n",
513
+ " src_padding_mask = (src == PAD_IDX).transpose(0, 1)\n",
514
+ " tgt_padding_mask = (tgt == PAD_IDX).transpose(0, 1)\n",
515
+ " return src_mask, tgt_mask, src_padding_mask, tgt_padding_mask"
516
+ ]
517
+ },
518
+ {
519
+ "cell_type": "code",
520
+ "execution_count": 96,
521
+ "metadata": {
522
+ "colab": {
523
+ "base_uri": "https://localhost:8080/"
524
+ },
525
+ "id": "DA3eAj9GZFus",
526
+ "outputId": "8132fcb6-84c1-44c9-a150-616467d36052"
527
+ },
528
+ "outputs": [
529
+ {
530
+ "output_type": "stream",
531
+ "name": "stderr",
532
+ "text": [
533
+ "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/transformer.py:286: UserWarning: enable_nested_tensor is True, but self.use_nested_tensor is False because encoder_layer.self_attn.batch_first was not True(use batch_first for better inference performance)\n",
534
+ " warnings.warn(f\"enable_nested_tensor is True, but self.use_nested_tensor is False because {why_not_sparsity_fast_path}\")\n"
535
+ ]
536
+ }
537
+ ],
538
+ "source": [
539
+ "torch.manual_seed(0)\n",
540
+ "\n",
541
+ "SRC_VOCAB_SIZE = len(vocab_transform[SRC_LANGUAGE])\n",
542
+ "TGT_VOCAB_SIZE = len(vocab_transform[TGT_LANGUAGE])\n",
543
+ "EMB_SIZE = 512\n",
544
+ "NHEAD = 8\n",
545
+ "FFN_HID_DIM = 512\n",
546
+ "BATCH_SIZE = 128\n",
547
+ "NUM_ENCODER_LAYERS = 3\n",
548
+ "NUM_DECODER_LAYERS = 3\n",
549
+ "\n",
550
+ "transformer = Seq2SeqTransformer(NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, EMB_SIZE,\n",
551
+ " NHEAD, SRC_VOCAB_SIZE, TGT_VOCAB_SIZE, FFN_HID_DIM)\n",
552
+ "\n",
553
+ "for p in transformer.parameters():\n",
554
+ " if p.dim() > 1:\n",
555
+ " nn.init.xavier_uniform_(p)\n",
556
+ "\n",
557
+ "transformer = transformer.to(DEVICE)\n",
558
+ "\n",
559
+ "loss_fn = torch.nn.CrossEntropyLoss(ignore_index=PAD_IDX)\n",
560
+ "\n",
561
+ "optimizer = torch.optim.Adam(transformer.parameters(), lr=0.0001, betas=(0.9, 0.98), eps=1e-9)"
562
+ ]
563
+ },
564
+ {
565
+ "cell_type": "code",
566
+ "execution_count": 97,
567
+ "metadata": {
568
+ "id": "IO9Y95SnZKys"
569
+ },
570
+ "outputs": [],
571
+ "source": [
572
+ "from torch.nn.utils.rnn import pad_sequence\n",
573
+ "\n",
574
+ "# helper function to club together sequential operations\n",
575
+ "def sequential_transforms(*transforms):\n",
576
+ " def func(txt_input):\n",
577
+ " for transform in transforms:\n",
578
+ " txt_input = transform(txt_input)\n",
579
+ " return txt_input\n",
580
+ " return func\n",
581
+ "\n",
582
+ "# function to add BOS/EOS and create tensor for input sequence indices\n",
583
+ "def tensor_transform(token_ids: List[int]):\n",
584
+ " return torch.cat((torch.tensor([BOS_IDX]),\n",
585
+ " torch.tensor(token_ids),\n",
586
+ " torch.tensor([EOS_IDX])))\n",
587
+ "\n",
588
+ "# ``src`` and ``tgt`` language text transforms to convert raw strings into tensors indices\n",
589
+ "text_transform = {}\n",
590
+ "for ln in [SRC_LANGUAGE, TGT_LANGUAGE]:\n",
591
+ " text_transform[ln] = sequential_transforms(token_transform[ln], #Tokenization\n",
592
+ " vocab_transform[ln], #Numericalization\n",
593
+ " tensor_transform) # Add BOS/EOS and create tensor\n",
594
+ "\n",
595
+ "\n",
596
+ "# function to collate data samples into batch tensors\n",
597
+ "def collate_fn(batch):\n",
598
+ " src_batch, tgt_batch = [], []\n",
599
+ " for src_sample, tgt_sample in batch:\n",
600
+ " src_batch.append(text_transform[SRC_LANGUAGE](src_sample.rstrip(\"\\n\")))\n",
601
+ " tgt_batch.append(text_transform[TGT_LANGUAGE](tgt_sample.rstrip(\"\\n\")))\n",
602
+ "\n",
603
+ " src_batch = pad_sequence(src_batch, padding_value=PAD_IDX)\n",
604
+ " tgt_batch = pad_sequence(tgt_batch, padding_value=PAD_IDX)\n",
605
+ " return src_batch, tgt_batch"
606
+ ]
607
+ },
608
+ {
609
+ "cell_type": "code",
610
+ "execution_count": 98,
611
+ "metadata": {
612
+ "id": "qw9lO5xvZSjb"
613
+ },
614
+ "outputs": [],
615
+ "source": [
616
+ "from torch.utils.data import DataLoader\n",
617
+ "\n",
618
+ "def train_epoch(model, optimizer):\n",
619
+ " model.train()\n",
620
+ " losses = 0\n",
621
+ " train_iter = Multi30k(split='train', language_pair=(SRC_LANGUAGE, TGT_LANGUAGE))\n",
622
+ " train_dataloader = DataLoader(train_iter, batch_size=BATCH_SIZE, collate_fn=collate_fn)\n",
623
+ "\n",
624
+ " for src, tgt in train_dataloader:\n",
625
+ " src = src.to(DEVICE)\n",
626
+ " tgt = tgt.to(DEVICE)\n",
627
+ "\n",
628
+ " tgt_input = tgt[:-1, :]\n",
629
+ "\n",
630
+ " src_mask, tgt_mask, src_padding_mask, tgt_padding_mask = create_mask(src, tgt_input)\n",
631
+ "\n",
632
+ " logits = model(src, tgt_input, src_mask, tgt_mask,src_padding_mask, tgt_padding_mask, src_padding_mask)\n",
633
+ "\n",
634
+ " optimizer.zero_grad()\n",
635
+ "\n",
636
+ " tgt_out = tgt[1:, :]\n",
637
+ " loss = loss_fn(logits.reshape(-1, logits.shape[-1]), tgt_out.reshape(-1))\n",
638
+ " loss.backward()\n",
639
+ "\n",
640
+ " optimizer.step()\n",
641
+ " losses += loss.item()\n",
642
+ "\n",
643
+ " return losses / len(list(train_dataloader))"
644
+ ]
645
+ },
646
+ {
647
+ "cell_type": "code",
648
+ "execution_count": 99,
649
+ "metadata": {
650
+ "id": "frdDbhZ_ZZ9d"
651
+ },
652
+ "outputs": [],
653
+ "source": [
654
+ "def evaluate(model):\n",
655
+ " model.eval()\n",
656
+ " losses = 0\n",
657
+ "\n",
658
+ " val_iter = Multi30k(split='valid', language_pair=(SRC_LANGUAGE, TGT_LANGUAGE))\n",
659
+ " val_dataloader = DataLoader(val_iter, batch_size=BATCH_SIZE, collate_fn=collate_fn)\n",
660
+ "\n",
661
+ " for src, tgt in val_dataloader:\n",
662
+ " src = src.to(DEVICE)\n",
663
+ " tgt = tgt.to(DEVICE)\n",
664
+ "\n",
665
+ " tgt_input = tgt[:-1, :]\n",
666
+ "\n",
667
+ " src_mask, tgt_mask, src_padding_mask, tgt_padding_mask = create_mask(src, tgt_input)\n",
668
+ "\n",
669
+ " logits = model(src, tgt_input, src_mask, tgt_mask,src_padding_mask, tgt_padding_mask, src_padding_mask)\n",
670
+ "\n",
671
+ " tgt_out = tgt[1:, :]\n",
672
+ " loss = loss_fn(logits.reshape(-1, logits.shape[-1]), tgt_out.reshape(-1))\n",
673
+ " losses += loss.item()\n",
674
+ "\n",
675
+ " return losses / len(list(val_dataloader))"
676
+ ]
677
+ },
678
+ {
679
+ "cell_type": "code",
680
+ "execution_count": null,
681
+ "metadata": {
682
+ "colab": {
683
+ "base_uri": "https://localhost:8080/"
684
+ },
685
+ "id": "xjLl776lZfJc",
686
+ "outputId": "6f0965d6-6e53-40b7-fe19-69096b68c3f8"
687
+ },
688
+ "outputs": [
689
+ {
690
+ "metadata": {
691
+ "tags": null
692
+ },
693
+ "name": "stderr",
694
+ "output_type": "stream",
695
+ "text": [
696
+ "/usr/local/lib/python3.10/dist-packages/torch/nn/functional.py:5109: UserWarning: Support for mismatched key_padding_mask and attn_mask is deprecated. Use same type for both instead.\n",
697
+ " warnings.warn(\n",
698
+ "/usr/local/lib/python3.10/dist-packages/torch/utils/data/datapipes/iter/combining.py:337: UserWarning: Some child DataPipes are not exhausted when __iter__ is called. We are resetting the buffer and each child DataPipe will read from the start again.\n",
699
+ " warnings.warn(\"Some child DataPipes are not exhausted when __iter__ is called. We are resetting \"\n"
700
+ ]
701
+ },
702
+ {
703
+ "output_type": "stream",
704
+ "name": "stdout",
705
+ "text": [
706
+ "Epoch: 1, Train loss: 5.344, Val loss: 4.106, Epoch time = 43.253s\n",
707
+ "Epoch: 2, Train loss: 3.761, Val loss: 3.309, Epoch time = 43.216s\n",
708
+ "Epoch: 3, Train loss: 3.157, Val loss: 2.887, Epoch time = 43.028s\n",
709
+ "Epoch: 4, Train loss: 2.767, Val loss: 2.640, Epoch time = 43.509s\n",
710
+ "Epoch: 5, Train loss: 2.477, Val loss: 2.442, Epoch time = 44.192s\n",
711
+ "Epoch: 6, Train loss: 2.247, Val loss: 2.306, Epoch time = 44.518s\n",
712
+ "Epoch: 7, Train loss: 2.055, Val loss: 2.207, Epoch time = 43.989s\n"
713
+ ]
714
+ }
715
+ ],
716
+ "source": [
717
+ "from timeit import default_timer as timer\n",
718
+ "NUM_EPOCHS = 10\n",
719
+ "\n",
720
+ "for epoch in range(1, NUM_EPOCHS+1):\n",
721
+ " start_time = timer()\n",
722
+ " train_loss = train_epoch(transformer, optimizer)\n",
723
+ " end_time = timer()\n",
724
+ " val_loss = evaluate(transformer)\n",
725
+ " print((f\"Epoch: {epoch}, Train loss: {train_loss:.3f}, Val loss: {val_loss:.3f}, \"f\"Epoch time = {(end_time - start_time):.3f}s\"))\n"
726
+ ]
727
+ },
728
+ {
729
+ "cell_type": "code",
730
+ "execution_count": 20,
731
+ "metadata": {
732
+ "id": "ebEhLx-3slOE"
733
+ },
734
+ "outputs": [],
735
+ "source": [
736
+ "torch.save(transformer.state_dict(), '/gdrive/My Drive/transformer_model.pth')"
737
+ ]
738
+ },
739
+ {
740
+ "cell_type": "code",
741
+ "execution_count": 58,
742
+ "metadata": {
743
+ "id": "OW8D2ALUtBQq"
744
+ },
745
+ "outputs": [],
746
+ "source": [
747
+ "def greedy_decode(model, src, src_mask, max_len, start_symbol):\n",
748
+ " src = src.to(DEVICE)\n",
749
+ " src_mask = src_mask.to(DEVICE)\n",
750
+ "\n",
751
+ " memory = model.encode(src, src_mask)\n",
752
+ " ys = torch.ones(1, 1).fill_(start_symbol).type(torch.long).to(DEVICE)\n",
753
+ " for i in range(max_len-1):\n",
754
+ " memory = memory.to(DEVICE)\n",
755
+ " tgt_mask = (generate_square_subsequent_mask(ys.size(0))\n",
756
+ " .type(torch.bool)).to(DEVICE)\n",
757
+ " out = model.decode(ys, memory, tgt_mask)\n",
758
+ " out = out.transpose(0, 1)\n",
759
+ " prob = model.generator(out[:, -1])\n",
760
+ " _, next_word = torch.max(prob, dim=1)\n",
761
+ " next_word = next_word.item()\n",
762
+ "\n",
763
+ " ys = torch.cat([ys,\n",
764
+ " torch.ones(1, 1).type_as(src.data).fill_(next_word)], dim=0)\n",
765
+ " if next_word == EOS_IDX:\n",
766
+ " break\n",
767
+ " return ys"
768
+ ]
769
+ },
770
+ {
771
+ "cell_type": "code",
772
+ "execution_count": 59,
773
+ "metadata": {
774
+ "id": "exM3fCaBtFk2",
775
+ "colab": {
776
+ "base_uri": "https://localhost:8080/"
777
+ },
778
+ "outputId": "726a1bab-c145-4861-f4d3-6cb5122a567c"
779
+ },
780
+ "outputs": [
781
+ {
782
+ "output_type": "stream",
783
+ "name": "stdout",
784
+ "text": [
785
+ "3\n",
786
+ "3\n",
787
+ "512\n",
788
+ "8\n",
789
+ "19214\n",
790
+ "10837\n",
791
+ "512\n"
792
+ ]
793
+ }
794
+ ],
795
+ "source": [
796
+ "# Load the saved model\n",
797
+ "loaded_model = Seq2SeqTransformer(NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, EMB_SIZE,\n",
798
+ " NHEAD, SRC_VOCAB_SIZE, TGT_VOCAB_SIZE, FFN_HID_DIM)\n",
799
+ "print(NUM_ENCODER_LAYERS)\n",
800
+ "print(NUM_DECODER_LAYERS)\n",
801
+ "print(EMB_SIZE)\n",
802
+ "print(NHEAD)\n",
803
+ "print(SRC_VOCAB_SIZE)\n",
804
+ "print(TGT_VOCAB_SIZE)\n",
805
+ "print(FFN_HID_DIM)\n",
806
+ "loaded_model.load_state_dict(torch.load('/gdrive/My Drive/transformer_model.pth'))\n",
807
+ "loaded_model.eval() # Make sure to set the model in evaluation mode\n",
808
+ "\n",
809
+ "# Incorporate the loaded model into the remaining portion of your code\n",
810
+ "def translate(model: torch.nn.Module, src_sentence: str):\n",
811
+ " model.eval()\n",
812
+ " src = text_transform[SRC_LANGUAGE](src_sentence).view(-1, 1)\n",
813
+ " num_tokens = src.shape[0]\n",
814
+ " src_mask = (torch.zeros(num_tokens, num_tokens)).type(torch.bool)\n",
815
+ " tgt_tokens = greedy_decode(\n",
816
+ " model, src, src_mask, max_len=num_tokens + 5, start_symbol=BOS_IDX).flatten()\n",
817
+ " return \" \".join(vocab_transform[TGT_LANGUAGE].lookup_tokens(list(tgt_tokens.cpu().numpy()))).replace(\"<bos>\", \"\").replace(\"<eos>\", \"\")\n"
818
+ ]
819
+ },
820
+ {
821
+ "cell_type": "code",
822
+ "execution_count": 60,
823
+ "metadata": {
824
+ "id": "85yPR0zBtOsZ",
825
+ "colab": {
826
+ "base_uri": "https://localhost:8080/"
827
+ },
828
+ "outputId": "44efc93c-5d86-4084-fc21-bb3bc5bae207"
829
+ },
830
+ "outputs": [
831
+ {
832
+ "output_type": "stream",
833
+ "name": "stdout",
834
+ "text": [
835
+ " Russia cloth spoof Russia sewing Madrid Madrid Russia silhouetted Madrid Russia Madrid Madrid Russia cloth\n"
836
+ ]
837
+ }
838
+ ],
839
+ "source": [
840
+ "print(translate(transformer, \"Eine Gruppe von Menschen steht vor einem Iglu .\"))"
841
+ ]
842
+ },
843
+ {
844
+ "cell_type": "code",
845
+ "execution_count": 24,
846
+ "metadata": {
847
+ "id": "HJF7lXj0tPjO",
848
+ "colab": {
849
+ "base_uri": "https://localhost:8080/"
850
+ },
851
+ "outputId": "0237b57f-29cf-4c75-a060-fb928dbd2ced"
852
+ },
853
+ "outputs": [
854
+ {
855
+ "output_type": "stream",
856
+ "name": "stdout",
857
+ "text": [
858
+ "Requirement already satisfied: transformers in /usr/local/lib/python3.10/dist-packages (4.38.2)\n",
859
+ "Requirement already satisfied: filelock in /usr/local/lib/python3.10/dist-packages (from transformers) (3.13.3)\n",
860
+ "Requirement already satisfied: huggingface-hub<1.0,>=0.19.3 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.20.3)\n",
861
+ "Requirement already satisfied: numpy>=1.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (1.25.2)\n",
862
+ "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from transformers) (24.0)\n",
863
+ "Requirement already satisfied: pyyaml>=5.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (6.0.1)\n",
864
+ "Requirement already satisfied: regex!=2019.12.17 in /usr/local/lib/python3.10/dist-packages (from transformers) (2023.12.25)\n",
865
+ "Requirement already satisfied: requests in /usr/local/lib/python3.10/dist-packages (from transformers) (2.31.0)\n",
866
+ "Requirement already satisfied: tokenizers<0.19,>=0.14 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.15.2)\n",
867
+ "Requirement already satisfied: safetensors>=0.4.1 in /usr/local/lib/python3.10/dist-packages (from transformers) (0.4.2)\n",
868
+ "Requirement already satisfied: tqdm>=4.27 in /usr/local/lib/python3.10/dist-packages (from transformers) (4.66.2)\n",
869
+ "Requirement already satisfied: fsspec>=2023.5.0 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.19.3->transformers) (2023.6.0)\n",
870
+ "Requirement already satisfied: typing-extensions>=3.7.4.3 in /usr/local/lib/python3.10/dist-packages (from huggingface-hub<1.0,>=0.19.3->transformers) (4.10.0)\n",
871
+ "Requirement already satisfied: charset-normalizer<4,>=2 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.3.2)\n",
872
+ "Requirement already satisfied: idna<4,>=2.5 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (3.6)\n",
873
+ "Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2.0.7)\n",
874
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.10/dist-packages (from requests->transformers) (2024.2.2)\n"
875
+ ]
876
+ }
877
+ ],
878
+ "source": [
879
+ "!pip install transformers"
880
+ ]
881
+ },
882
+ {
883
+ "cell_type": "code",
884
+ "execution_count": 25,
885
+ "metadata": {
886
+ "id": "TMLnV5aMtSco"
887
+ },
888
+ "outputs": [],
889
+ "source": [
890
+ "from transformers.modeling_utils import PreTrainedModel ,PretrainedConfig"
891
+ ]
892
+ },
893
+ {
894
+ "cell_type": "code",
895
+ "execution_count": 27,
896
+ "metadata": {
897
+ "id": "oP9ODxPxtWPI"
898
+ },
899
+ "outputs": [],
900
+ "source": [
901
+ "class Seq2SeqTransformer(PreTrainedModel):\n",
902
+ " def __init__(self,config):\n",
903
+ " super(Seq2SeqTransformer, self).__init__(config)\n",
904
+ " self.transformer = Transformer(d_model=config.emb_size,\n",
905
+ " nhead=config.nhead,\n",
906
+ " num_encoder_layers=config.num_encoder_layers,\n",
907
+ " num_decoder_layers=config.num_decoder_layers,\n",
908
+ " dim_feedforward=config.dim_feedforward,\n",
909
+ " dropout=config.dropout)\n",
910
+ " self.generator = nn.Linear(config.emb_size, config.tgt_vocab_size)\n",
911
+ " self.src_tok_emb = TokenEmbedding(config.src_vocab_size, config.emb_size)\n",
912
+ " self.tgt_tok_emb = TokenEmbedding(config.tgt_vocab_size, config.emb_size)\n",
913
+ " self.positional_encoding = PositionalEncoding(\n",
914
+ " config.emb_size, dropout=config.dropout)"
915
+ ]
916
+ },
917
+ {
918
+ "cell_type": "code",
919
+ "execution_count": 30,
920
+ "metadata": {
921
+ "id": "_uOmJ7oQtdVF"
922
+ },
923
+ "outputs": [],
924
+ "source": [
925
+ "config = PretrainedConfig(\n",
926
+ " # Specify your vocabulary size\n",
927
+ " dim_feedforward =512,\n",
928
+ " dropout= 0.1,\n",
929
+ " emb_size= 512,\n",
930
+ " num_decoder_layers= 3,\n",
931
+ " num_encoder_layers= 3,\n",
932
+ " nhead= 8,\n",
933
+ " src_vocab_size= 19214,\n",
934
+ " tgt_vocab_size= 10837\n",
935
+ ")"
936
+ ]
937
+ },
938
+ {
939
+ "cell_type": "code",
940
+ "execution_count": 33,
941
+ "metadata": {
942
+ "id": "DO15AHGZtjwA"
943
+ },
944
+ "outputs": [],
945
+ "source": [
946
+ "model = Seq2SeqTransformer(config)\n",
947
+ "model.to(DEVICE)\n",
948
+ "\n",
949
+ "\n",
950
+ "model.save_pretrained('/gdrive/My Drive')"
951
+ ]
952
+ },
953
+ {
954
+ "cell_type": "code",
955
+ "source": [
956
+ "!pip install -q gradio==3.48.0"
957
+ ],
958
+ "metadata": {
959
+ "colab": {
960
+ "base_uri": "https://localhost:8080/"
961
+ },
962
+ "id": "vJicfSC62R86",
963
+ "outputId": "ddb7f709-daff-4376-e15a-d936397e8ec3"
964
+ },
965
+ "execution_count": 35,
966
+ "outputs": [
967
+ {
968
+ "output_type": "stream",
969
+ "name": "stdout",
970
+ "text": [
971
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m20.3/20.3 MB\u001b[0m \u001b[31m57.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
972
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m91.9/91.9 kB\u001b[0m \u001b[31m11.2 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
973
+ "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
974
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m299.2/299.2 kB\u001b[0m \u001b[31m34.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
975
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m75.6/75.6 kB\u001b[0m \u001b[31m10.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
976
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m144.8/144.8 kB\u001b[0m \u001b[31m17.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
977
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m60.8/60.8 kB\u001b[0m \u001b[31m8.0 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
978
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m129.9/129.9 kB\u001b[0m \u001b[31m15.9 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
979
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m58.3/58.3 kB\u001b[0m \u001b[31m7.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
980
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m71.9/71.9 kB\u001b[0m \u001b[31m9.8 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
981
+ "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m77.9/77.9 kB\u001b[0m \u001b[31m10.3 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
982
+ "\u001b[?25h Building wheel for ffmpy (setup.py) ... \u001b[?25l\u001b[?25hdone\n"
983
+ ]
984
+ }
985
+ ]
986
+ },
987
+ {
988
+ "cell_type": "code",
989
+ "source": [
990
+ "import gradio as gr\n",
991
+ "import torch\n",
992
+ "from torchtext.data.utils import get_tokenizer\n",
993
+ "from torchtext.vocab import build_vocab_from_iterator\n",
994
+ "from torchtext.datasets import Multi30k\n",
995
+ "from torch import Tensor\n",
996
+ "from typing import Iterable, List\n",
997
+ "\n",
998
+ "# Define your model, tokenizer, and other necessary components here\n",
999
+ "# Ensure you have imported all necessary libraries\n",
1000
+ "\n",
1001
+ "# Load your transformer model\n",
1002
+ "model = Seq2SeqTransformer(NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, EMB_SIZE,\n",
1003
+ " NHEAD, SRC_VOCAB_SIZE, TGT_VOCAB_SIZE, FFN_HID_DIM)\n",
1004
+ "device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n",
1005
+ "model.load_state_dict(torch.load('/gdrive/My Drive/transformer_model.pth', map_location=device))\n",
1006
+ "model.eval()\n",
1007
+ "\n",
1008
+ "\n",
1009
+ "def translate(model: torch.nn.Module, src_sentence: str):\n",
1010
+ " model.eval()\n",
1011
+ " src = text_transform[SRC_LANGUAGE](src_sentence).view(-1, 1)\n",
1012
+ " num_tokens = src.shape[0]\n",
1013
+ " src_mask = (torch.zeros(num_tokens, num_tokens)).type(torch.bool)\n",
1014
+ " tgt_tokens = greedy_decode(\n",
1015
+ " model, src, src_mask, max_len=num_tokens + 5, start_symbol=BOS_IDX).flatten()\n",
1016
+ " return \" \".join(vocab_transform[TGT_LANGUAGE].lookup_tokens(list(tgt_tokens.cpu().numpy()))).replace(\"<bos>\", \"\").replace(\"<eos>\", \"\")\n",
1017
+ "\n",
1018
+ "\n"
1019
+ ],
1020
+ "metadata": {
1021
+ "colab": {
1022
+ "base_uri": "https://localhost:8080/"
1023
+ },
1024
+ "id": "wgBhx0w7-EUa",
1025
+ "outputId": "170f3d83-5c56-4cc6-da52-273b8f63e885"
1026
+ },
1027
+ "execution_count": 90,
1028
+ "outputs": [
1029
+ {
1030
+ "output_type": "stream",
1031
+ "name": "stderr",
1032
+ "text": [
1033
+ "/usr/local/lib/python3.10/dist-packages/torch/nn/modules/transformer.py:286: UserWarning: enable_nested_tensor is True, but self.use_nested_tensor is False because encoder_layer.self_attn.batch_first was not True(use batch_first for better inference performance)\n",
1034
+ " warnings.warn(f\"enable_nested_tensor is True, but self.use_nested_tensor is False because {why_not_sparsity_fast_path}\")\n"
1035
+ ]
1036
+ }
1037
+ ]
1038
+ },
1039
+ {
1040
+ "cell_type": "code",
1041
+ "source": [
1042
+ "if __name__ == \"__main__\":\n",
1043
+ " # Create the Gradio interface\n",
1044
+ " iface = gr.Interface(\n",
1045
+ " fn=translate, # Specify the translation function as the main function\n",
1046
+ " inputs=[\n",
1047
+ " gr.inputs.Textbox(label=\"Text\"),\n",
1048
+ " gr.inputs.Textbox(label=\"Text\")\n",
1049
+ "\n",
1050
+ " ],\n",
1051
+ " outputs=[\"text\"], # Define the output type as text\n",
1052
+ " #examples=[[\"I'm ready\", \"english\", \"arabic\"]], # Provide an example input for demonstration\n",
1053
+ " cache_examples=False, # Disable caching of examples\n",
1054
+ " title=\"germanToenglish\", # Set the title of the interface\n",
1055
+ " #description=\"This is a translator app for arabic and english. Currently supports only english to arabic.\" # Add a description of the interface\n",
1056
+ " )\n",
1057
+ "\n",
1058
+ " # Launch the interface\n",
1059
+ " iface.launch(share=True)"
1060
+ ],
1061
+ "metadata": {
1062
+ "colab": {
1063
+ "base_uri": "https://localhost:8080/",
1064
+ "height": 819
1065
+ },
1066
+ "id": "y9CN022m-hGQ",
1067
+ "outputId": "34971409-3c9d-46a8-a741-e785d597d18c"
1068
+ },
1069
+ "execution_count": 91,
1070
+ "outputs": [
1071
+ {
1072
+ "output_type": "stream",
1073
+ "name": "stderr",
1074
+ "text": [
1075
+ "<ipython-input-91-b142228ac367>:6: GradioDeprecationWarning: Usage of gradio.inputs is deprecated, and will not be supported in the future, please import your component from gradio.components\n",
1076
+ " gr.inputs.Textbox(label=\"Text\"),\n",
1077
+ "<ipython-input-91-b142228ac367>:6: GradioDeprecationWarning: `optional` parameter is deprecated, and it has no effect\n",
1078
+ " gr.inputs.Textbox(label=\"Text\"),\n",
1079
+ "<ipython-input-91-b142228ac367>:6: GradioDeprecationWarning: `numeric` parameter is deprecated, and it has no effect\n",
1080
+ " gr.inputs.Textbox(label=\"Text\"),\n",
1081
+ "<ipython-input-91-b142228ac367>:7: GradioDeprecationWarning: Usage of gradio.inputs is deprecated, and will not be supported in the future, please import your component from gradio.components\n",
1082
+ " gr.inputs.Textbox(label=\"Text\")\n",
1083
+ "<ipython-input-91-b142228ac367>:7: GradioDeprecationWarning: `optional` parameter is deprecated, and it has no effect\n",
1084
+ " gr.inputs.Textbox(label=\"Text\")\n",
1085
+ "<ipython-input-91-b142228ac367>:7: GradioDeprecationWarning: `numeric` parameter is deprecated, and it has no effect\n",
1086
+ " gr.inputs.Textbox(label=\"Text\")\n"
1087
+ ]
1088
+ },
1089
+ {
1090
+ "output_type": "stream",
1091
+ "name": "stdout",
1092
+ "text": [
1093
+ "Colab notebook detected. To show errors in colab notebook, set debug=True in launch()\n",
1094
+ "Running on public URL: https://05da874e546ecf0271.gradio.live\n",
1095
+ "\n",
1096
+ "This share link expires in 72 hours. For free permanent hosting and GPU upgrades, run `gradio deploy` from Terminal to deploy to Spaces (https://huggingface.co/spaces)\n"
1097
+ ]
1098
+ },
1099
+ {
1100
+ "output_type": "display_data",
1101
+ "data": {
1102
+ "text/plain": [
1103
+ "<IPython.core.display.HTML object>"
1104
+ ],
1105
+ "text/html": [
1106
+ "<div><iframe src=\"https://05da874e546ecf0271.gradio.live\" width=\"100%\" height=\"500\" allow=\"autoplay; camera; microphone; clipboard-read; clipboard-write;\" frameborder=\"0\" allowfullscreen></iframe></div>"
1107
+ ]
1108
+ },
1109
+ "metadata": {}
1110
+ }
1111
+ ]
1112
+ },
1113
+ {
1114
+ "cell_type": "code",
1115
+ "source": [
1116
+ "if __name__ == \"__main__\":\n",
1117
+ " # Create the Gradio interface\n",
1118
+ " iface = gr.Interface(\n",
1119
+ " fn=translate, # Specify the translation function as the main function\n",
1120
+ " inputs=[\n",
1121
+ " gr.components.Textbox(label=\"Text\"), # Add a textbox input for entering text\n",
1122
+ " gr.components.Dropdown(label=\"Source Language\", choices=language), # Add a dropdown for selecting source language\n",
1123
+ " gr.components.Dropdown(label=\"Target Language\", choices=language), # Add a dropdown for selecting target language\n",
1124
+ " ],\n",
1125
+ " outputs=[\"text\"], # Define the output type as text\n",
1126
+ " #examples=[[\"I'm ready\", \"english\", \"arabic\"]], # Provide an example input for demonstration\n",
1127
+ " cache_examples=False, # Disable caching of examples\n",
1128
+ " title=\"germanToenglish\", # Set the title of the interface\n",
1129
+ " #description=\"This is a translator app for arabic and english. Currently supports only english to arabic.\" # Add a description of the interface\n",
1130
+ " )\n",
1131
+ "\n",
1132
+ " # Launch the interface\n",
1133
+ " iface.launch(share=True)"
1134
+ ],
1135
+ "metadata": {
1136
+ "colab": {
1137
+ "base_uri": "https://localhost:8080/",
1138
+ "height": 680
1139
+ },
1140
+ "id": "NRTdTJ8E72LQ",
1141
+ "outputId": "6d76e9c7-8f46-498b-e0a6-b6aa74b48fc6"
1142
+ },
1143
+ "execution_count": 45,
1144
+ "outputs": [
1145
+ {
1146
+ "output_type": "stream",
1147
+ "name": "stderr",
1148
+ "text": [
1149
+ "/usr/local/lib/python3.10/dist-packages/gradio/utils.py:812: UserWarning: Expected 2 arguments for function <function translate at 0x7d1bb879fc70>, received 3.\n",
1150
+ " warnings.warn(\n",
1151
+ "/usr/local/lib/python3.10/dist-packages/gradio/utils.py:820: UserWarning: Expected maximum 2 arguments for function <function translate at 0x7d1bb879fc70>, received 3.\n",
1152
+ " warnings.warn(\n"
1153
+ ]
1154
+ },
1155
+ {
1156
+ "output_type": "stream",
1157
+ "name": "stdout",
1158
+ "text": [
1159
+ "Colab notebook detected. To show errors in colab notebook, set debug=True in launch()\n",
1160
+ "Running on public URL: https://652be12920500f856f.gradio.live\n",
1161
+ "\n",
1162
+ "This share link expires in 72 hours. For free permanent hosting and GPU upgrades, run `gradio deploy` from Terminal to deploy to Spaces (https://huggingface.co/spaces)\n"
1163
+ ]
1164
+ },
1165
+ {
1166
+ "output_type": "display_data",
1167
+ "data": {
1168
+ "text/plain": [
1169
+ "<IPython.core.display.HTML object>"
1170
+ ],
1171
+ "text/html": [
1172
+ "<div><iframe src=\"https://652be12920500f856f.gradio.live\" width=\"100%\" height=\"500\" allow=\"autoplay; camera; microphone; clipboard-read; clipboard-write;\" frameborder=\"0\" allowfullscreen></iframe></div>"
1173
+ ]
1174
+ },
1175
+ "metadata": {}
1176
+ }
1177
+ ]
1178
+ },
1179
+ {
1180
+ "cell_type": "code",
1181
+ "source": [],
1182
+ "metadata": {
1183
+ "id": "5RuYPqUT3M3M"
1184
+ },
1185
+ "execution_count": null,
1186
+ "outputs": []
1187
+ }
1188
+ ],
1189
+ "metadata": {
1190
+ "accelerator": "GPU",
1191
+ "colab": {
1192
+ "gpuType": "T4",
1193
+ "provenance": []
1194
+ },
1195
+ "kernelspec": {
1196
+ "display_name": "Python 3",
1197
+ "name": "python3"
1198
+ },
1199
+ "language_info": {
1200
+ "name": "python"
1201
+ }
1202
+ },
1203
+ "nbformat": 4,
1204
+ "nbformat_minor": 0
1205
+ }