Skip to content

Commit 4b9931d

Browse files
committed
rearrange notebooks and add todo on 5th notebook
1 parent 9f92ec6 commit 4b9931d

File tree

7 files changed

+186
-74
lines changed

7 files changed

+186
-74
lines changed
Lines changed: 109 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,109 @@
1+
{
2+
"cells": [
3+
{
4+
"cell_type": "markdown",
5+
"metadata": {},
6+
"source": [
7+
"# Machine Translation\n",
8+
"\n",
9+
"What is machine translation\n",
10+
"- Translation converts a sequence of text from one language to another. \n",
11+
"\n",
12+
"\n",
13+
"Reference > https://huggingface.co/docs/transformers/en/tasks/translation"
14+
]
15+
},
16+
{
17+
"cell_type": "code",
18+
"execution_count": null,
19+
"metadata": {},
20+
"outputs": [],
21+
"source": [
22+
"!pip install transformers[sentencepiece]"
23+
]
24+
},
25+
{
26+
"cell_type": "markdown",
27+
"metadata": {},
28+
"source": [
29+
"##### The translation model translates text from the source language to the target language.\n"
30+
]
31+
},
32+
{
33+
"cell_type": "code",
34+
"execution_count": null,
35+
"metadata": {},
36+
"outputs": [],
37+
"source": [
38+
"from transformers import pipeline\n",
39+
"\n",
40+
"# English to French\n",
41+
"translator = pipeline(\"translation_xx_to_yy\", model=\"google-t5/t5-small\")\n",
42+
"\n",
43+
"## Translate English to French\n",
44+
"text = \"translate English to French: Legumes share resources with nitrogen-fixing bacteria.\" \n",
45+
"\n",
46+
"print(translator(text)) "
47+
]
48+
},
49+
{
50+
"cell_type": "markdown",
51+
"metadata": {},
52+
"source": [
53+
"### Translation TH-ENG model"
54+
]
55+
},
56+
{
57+
"cell_type": "code",
58+
"execution_count": null,
59+
"metadata": {},
60+
"outputs": [],
61+
"source": [
62+
"## Load the pre-trained model\n",
63+
"pipeline = pipeline(\"translation\", model=\"Helsinki-NLP/opus-mt-th-en\")"
64+
]
65+
},
66+
{
67+
"cell_type": "markdown",
68+
"metadata": {},
69+
"source": [
70+
"- Model \"Helsinki-NLP/opus-mt-th-en\"\n",
71+
"- Source group : Thai\n",
72+
"- Target group : English"
73+
]
74+
},
75+
{
76+
"cell_type": "code",
77+
"execution_count": null,
78+
"metadata": {},
79+
"outputs": [],
80+
"source": [
81+
"## this model is for Thai to English translation\n",
82+
"\n",
83+
"text = \"translate Thai to English : สวัสดีครับ ยินดีที่ได้รู้จักครับ\"\n",
84+
"print(pipeline(text))"
85+
]
86+
}
87+
],
88+
"metadata": {
89+
"kernelspec": {
90+
"display_name": "biomedparse",
91+
"language": "python",
92+
"name": "python3"
93+
},
94+
"language_info": {
95+
"codemirror_mode": {
96+
"name": "ipython",
97+
"version": 3
98+
},
99+
"file_extension": ".py",
100+
"mimetype": "text/x-python",
101+
"name": "python",
102+
"nbconvert_exporter": "python",
103+
"pygments_lexer": "ipython3",
104+
"version": "3.9.19"
105+
}
106+
},
107+
"nbformat": 4,
108+
"nbformat_minor": 2
109+
}

ml-app-gradio/3_Speech-2-text.ipynb

Lines changed: 51 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -28,19 +28,18 @@
2828
},
2929
{
3030
"cell_type": "code",
31-
"execution_count": 2,
31+
"execution_count": null,
32+
"metadata": {},
33+
"outputs": [],
34+
"source": [
35+
"!pip install transformers"
36+
]
37+
},
38+
{
39+
"cell_type": "code",
40+
"execution_count": null,
3241
"metadata": {},
33-
"outputs": [
34-
{
35-
"name": "stderr",
36-
"output_type": "stream",
37-
"text": [
38-
"/home/badboy-005/anaconda3/envs/biomedparse/lib/python3.9/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
39-
" from .autonotebook import tqdm as notebook_tqdm\n",
40-
"Device set to use cuda:0\n"
41-
]
42-
}
43-
],
42+
"outputs": [],
4443
"source": [
4544
"from transformers import pipeline\n",
4645
"import torch\n",
@@ -69,7 +68,46 @@
6968
"metadata": {},
7069
"outputs": [],
7170
"source": [
72-
"text = pipe(\"audio.mp3\")[\"text\"] # give audio mp3 and transcribe text"
71+
"!pip install pytubefix"
72+
]
73+
},
74+
{
75+
"cell_type": "code",
76+
"execution_count": null,
77+
"metadata": {},
78+
"outputs": [],
79+
"source": [
80+
"# importing packages\n",
81+
"from pytubefix import YouTube\n",
82+
"import os\n",
83+
"\n",
84+
"yt = YouTube(\"https://www.youtube.com/watch?v=IoO07mDIBr4&list=RDIoO07mDIBr4&start_radio=1\")\n",
85+
"\n",
86+
"video = yt.streams.filter(only_audio=True).first()\n",
87+
"os.makedirs(\"audio_example\", exist_ok=True)\n",
88+
"out_file = video.download(output_path=\"audio_example\")\n",
89+
"\n",
90+
"new_file = \"audio_example/audio\" + '.mp3'\n",
91+
"os.rename(out_file, new_file)\n"
92+
]
93+
},
94+
{
95+
"cell_type": "code",
96+
"execution_count": null,
97+
"metadata": {},
98+
"outputs": [],
99+
"source": [
100+
"text = pipe(\"audio_example/audio.mp3\")[\"text\"] # give audio mp3 and transcribe text\n",
101+
"## this would take a while to process"
102+
]
103+
},
104+
{
105+
"cell_type": "code",
106+
"execution_count": null,
107+
"metadata": {},
108+
"outputs": [],
109+
"source": [
110+
"print(text)"
73111
]
74112
}
75113
],

ml-app-gradio/4_Text-2-image.ipynb

Lines changed: 12 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -9,12 +9,24 @@
99
"!pip install diffusers"
1010
]
1111
},
12+
{
13+
"cell_type": "markdown",
14+
"metadata": {},
15+
"source": [
16+
"## Text-2-image\n",
17+
"\n",
18+
"- Text-to-image is the task of generating images from input text.\n",
19+
"\n",
20+
"Reference : https://huggingface.co/tasks/text-to-image"
21+
]
22+
},
1223
{
1324
"cell_type": "code",
1425
"execution_count": null,
1526
"metadata": {},
1627
"outputs": [],
1728
"source": [
29+
"# Importing the required libraries\n",
1830
"import gradio as gr\n",
1931
"from diffusers import StableDiffusionPipeline\n",
2032
"import torch"
@@ -48,13 +60,6 @@
4860
"# Launch the interface\n",
4961
"demo.launch()"
5062
]
51-
},
52-
{
53-
"cell_type": "code",
54-
"execution_count": null,
55-
"metadata": {},
56-
"outputs": [],
57-
"source": []
5863
}
5964
],
6065
"metadata": {

ml-app-gradio/2_Image-2-text.ipynb renamed to ml-app-gradio/5_Image-2-text.ipynb

Lines changed: 14 additions & 38 deletions
Original file line numberDiff line numberDiff line change
@@ -11,8 +11,7 @@
1111
"cell_type": "markdown",
1212
"metadata": {},
1313
"source": [
14-
"From the previous notebook, we understand the basic concept of gradio application\n",
15-
"and how to use it. \n",
14+
"- Image to text models output a text from a given image.\n",
1615
"\n",
1716
"In this notebook, we will use the LLaVA model, which is a multimodal\n",
1817
"model that can generate text from the image. "
@@ -110,18 +109,10 @@
110109
" max_new_tokens=100\n",
111110
")\n",
112111
"\n",
113-
"output_text = processor.batch_decode(generate_ids, skip_special_tokens=True) # Decode the generated text"
114-
]
115-
},
116-
{
117-
"cell_type": "code",
118-
"execution_count": null,
119-
"metadata": {},
120-
"outputs": [],
121-
"source": [
122-
"print(output_text)\n",
112+
"output_text = processor.batch_decode(generate_ids, skip_special_tokens=True) # Decode the generated text\n",
123113
"\n",
124-
"## The output text is contain \"USER\" input and the generated text from the model"
114+
"## The output text is contain \"USER\" input and the generated text from the model\n",
115+
"print(output_text)"
125116
]
126117
},
127118
{
@@ -146,33 +137,17 @@
146137
},
147138
{
148139
"cell_type": "code",
149-
"execution_count": 6,
140+
"execution_count": null,
150141
"metadata": {},
151142
"outputs": [],
152143
"source": [
144+
"# TODO : Try to put image-2-text in gradio platform and see the output\n",
145+
"\n",
153146
"def generate_description(image, prompt = \"What is shown in this image?\", max_new_tokens=200):\n",
154-
" \n",
155-
" conversation = [\n",
156-
" {\n",
157-
" \"role\": \"user\",\n",
158-
" \"content\": [\n",
159-
" {\"type\": \"image\"},\n",
160-
" {\"type\": \"text\", \"text\": prompt},\n",
161-
" ],\n",
162-
" },\n",
163-
" ]\n",
164-
" prompt = processor.apply_chat_template(conversation, add_generation_prompt=True)\n",
165-
" inputs = processor(\n",
166-
" images=[image],\n",
167-
" text=[prompt],\n",
168-
" return_tensors=\"pt\"\n",
169-
" ).to(device=\"cuda\", dtype=torch.float16)\n",
170-
" generate_ids = model.generate(\n",
171-
" **inputs,\n",
172-
" do_sample=True,\n",
173-
" max_new_tokens=max_new_tokens\n",
174-
" )\n",
175-
" generated_description = processor.batch_decode(generate_ids, skip_special_tokens=True)\n",
147+
" \"\"\"\n",
148+
" Generate a description of the image using the model\n",
149+
" \"\"\"\n",
150+
" ## Guide : use the above code as the reference to write the code\n",
176151
"\n",
177152
" return generated_description[0]"
178153
]
@@ -218,13 +193,14 @@
218193
"import gradio as gr\n",
219194
"\n",
220195
"demo = gr.Interface(\n",
221-
" fn=lambda img, prompt: generate_description(img, prompt),\n",
196+
" fn=lambda img, prompt: ... , ## put the function here\n",
222197
" inputs=[gr.Image(type=\"pil\"),\n",
223-
" gr.Textbox(label=\"prompt\", value=\"What is shown in this image?\", lines=3)], # Changed to numpy\n",
198+
" gr.Textbox(label=\"prompt\", value=\"What is shown in this image?\", lines=3)], \n",
224199
" outputs=[gr.Textbox(label=\"Description\", lines=3)],\n",
225200
" title=\"Image Description using LLaVA\",\n",
226201
" description=\"Upload an image to get a detailed description using LLaVA-1.5-7b\",\n",
227202
")\n",
203+
"\n",
228204
"demo.launch()"
229205
]
230206
},

ml-app-gradio/5_Machine_translation.ipynb

Lines changed: 0 additions & 16 deletions
This file was deleted.

ml-app-gradio/audio_example/audio.mp3

1.61 MB
Binary file not shown.

ml-app-gradio/ุุ6_Chatbot.ipynb

Whitespace-only changes.

0 commit comments

Comments
 (0)