Sony
/

AKI-4B-phi-3.5-mini

Image-Text-to-Text

Safetensors

English

conversational

Model card Files and versions Community

SwyWang committed 14 days ago

Commit

49d5b39

verified ·

1 Parent(s): 7eb0198

Upload demo.ipynb

Browse files

Files changed (1) hide show

demo.ipynb +110 -7

demo.ipynb CHANGED Viewed

@@ -25,7 +25,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -66,6 +66,76 @@
    "execution_count": null,
    "metadata": {},
    "outputs": [
     {
      "name": "stderr",
      "output_type": "stream",
@@ -79,7 +149,7 @@
     {
      "data": {
       "application/vnd.jupyter.widget-view+json": {
-       "model_id": "64e0aee907ed4b29b238f38b74762f95",
        "version_major": 2,
        "version_minor": 0
       },
@@ -90,17 +160,30 @@
      "metadata": {},
      "output_type": "display_data"
     },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Loading weights from local directory\n",
       "Model initialization is done.\n"
      ]
     }
    ],
    "source": [
-    "model_path = \"aki-phi3.5-mini-4b\"\n",
     "config = AutoConfig.from_pretrained(model_path)\n",
     "# Load model, image_processor, tokenizer\n",
     "model, image_processor, tokenizer = load_model_and_processor(model_path, config=config)"
@@ -108,7 +191,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -158,7 +241,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
    "metadata": {},
    "outputs": [
     {
@@ -182,7 +265,20 @@
       "<image>\n",
       "Describe the scene of this image.<|end|>\n",
       "<|assistant|>\n",
-      "\n",
       "Response:\n",
       " The image captures a beautiful autumn day in a park, with a pathway covered in a vibrant carpet of fallen leaves. The leaves are in various shades of red, orange, yellow, and brown, creating a warm and colorful atmosphere. The path is lined with trees displaying beautiful autumn foliage, adding to the picturesque setting.\n",
       "\n",
@@ -196,6 +292,13 @@
     "response = process_input(image_path, text_input)\n",
     "print(\"Response:\\n\", response)"
    ]
   }
  ],
  "metadata": {

   },
   {
    "cell_type": "code",
+   "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
    "execution_count": null,
    "metadata": {},
    "outputs": [
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "09f13b1e5bae415f9f6a123d836b1d47",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "config.json:   0%|          | 0.00/387 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "e6f700961c5c4da3b326106d2dae74a2",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer_config.json:   0%|          | 0.00/3.99k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "9254a5341c3e44eeba3f2aed206701e5",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "tokenizer.model:   0%|          | 0.00/500k [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "7fadd9569a1549a2a81e4f0742d6910a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "added_tokens.json:   0%|          | 0.00/358 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "828eef207c5e4037ae41da262449b165",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "special_tokens_map.json:   0%|          | 0.00/887 [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
     {
      "name": "stderr",
      "output_type": "stream",
     {
      "data": {
       "application/vnd.jupyter.widget-view+json": {
+       "model_id": "4d2309ed29bb477d991fa95f556dbb4e",
        "version_major": 2,
        "version_minor": 0
       },
      "metadata": {},
      "output_type": "display_data"
     },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5d125663ad7f46c0b4820ea4d236f01a",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "model.safetensors:   0%|          | 0.00/17.3G [00:00<?, ?B/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
       "Model initialization is done.\n"
      ]
     }
    ],
    "source": [
+    "model_path = \"Sony/AKI-4B-phi-3.5-mini\"\n",
     "config = AutoConfig.from_pretrained(model_path)\n",
     "# Load model, image_processor, tokenizer\n",
     "model, image_processor, tokenizer = load_model_and_processor(model_path, config=config)"
   },
   {
    "cell_type": "code",
+   "execution_count": 9,
    "metadata": {},
    "outputs": [],
    "source": [
   },
   {
    "cell_type": "code",
+   "execution_count": 10,
    "metadata": {},
    "outputs": [
     {
       "<image>\n",
       "Describe the scene of this image.<|end|>\n",
       "<|assistant|>\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "You are not running the flash-attention implementation, expect numerical differences.\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
       "Response:\n",
       " The image captures a beautiful autumn day in a park, with a pathway covered in a vibrant carpet of fallen leaves. The leaves are in various shades of red, orange, yellow, and brown, creating a warm and colorful atmosphere. The path is lined with trees displaying beautiful autumn foliage, adding to the picturesque setting.\n",
       "\n",
     "response = process_input(image_path, text_input)\n",
     "print(\"Response:\\n\", response)"
    ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
   }
  ],
  "metadata": {