Spaces:

daspartho
/

is-it-huggable

Running

App Files Files Community

daspartho committed on Aug 25, 2022

Commit

fed847e

•

1 Parent(s): 02182ab

updated model

Browse files

Files changed (2) hide show

model.ipynb +273 -0
model.pkl +2 -2

model.ipynb ADDED Viewed

	@@ -0,0 +1,273 @@

+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "FDfI95Sh1lW0"
+      },
+      "source": [
+        "# Is it Huggable?\n",
+        "*Classify objects as huggable or not.*\n",
+        "\n",
+        "This notebook walks through the steps used to build the model.\n",
+        "\n",
+        "Just want to play? Try it directly on the [website](https://daspartho.github.io/is-it-huggable)."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "r-GyBdvhzfY2"
+      },
+      "source": [
+        "### Install required libraries"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "CQdd5Egc-FQV"
+      },
+      "outputs": [],
+      "source": [
+        "!pip install -Uqq fastai duckduckgo_search"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "vgvpU91p0ERn"
+      },
+      "source": [
+        "### Import the required modules"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": 2,
+      "metadata": {
+        "id": "BD7-yF0l-Y4h"
+      },
+      "outputs": [],
+      "source": [
+        "from duckduckgo_search import ddg_images\n",
+        "from fastcore.all import *\n",
+        "from fastdownload import download_url\n",
+        "from fastai.vision.all import *"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "WKZC9jY_zOfx"
+      },
+      "source": [
+        "### Use DuckDuckGo to search for example images of the two groups"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "hqnqTAXWCAn6"
+      },
+      "outputs": [],
+      "source": [
+        "def search_images(term, max_images=50):\n",
+        "    print(f\"Searching for '{term}'\")\n",
+        "    return L(ddg_images(term, max_results=max_images)).itemgot('image')\n",
+        "\n",
+        "path = Path('huggable_or_not')\n",
+        "\n",
+        "# examples of both groups\n",
+        "categories={\n",
+        "   'huggable':['plushie', 'pillow' , 'balloon', 'dog', 'cat', 'bunny', 'snowman', 'bed', 'sofa', 'people', 'baby', 'cloud', 'dolphin', 'horse', 'cow', 'sheep'], \n",
+        "   'not huggable':['chainsaw', 'sword', 'cactus', 'barbwire', 'bear', 'snake', 'lion', 'shark', 'fire','knife','fork', 'dinosaur', 'crocodile', 'spider', 'bees', 'porcupine']\n",
+        "   }\n",
+        "\n",
+        "for category in categories:\n",
+        "    dest = (path/category)\n",
+        "    dest.mkdir(exist_ok=True, parents=True)\n",
+        "    for example in categories[category]:\n",
+        "        download_images(dest, urls=search_images(f'{example} photo'))\n",
+        "        resize_images(path/category, max_size=400, dest=path/category)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "Bpsp4MTGxBWl"
+      },
+      "source": [
+        "### Remove photos that didn't download correctly."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "FzuHMc_qD0UO"
+      },
+      "outputs": [],
+      "source": [
+        "failed = verify_images(get_image_files(path))\n",
+        "failed.map(Path.unlink)\n",
+        "len(failed)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "eFFr_VE45ihe"
+      },
+      "source": [
+        "### Preparing the data for training"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "wzSeghRAFYqF"
+      },
+      "outputs": [],
+      "source": [
+        "dls = DataBlock(\n",
+        "    blocks=(ImageBlock, CategoryBlock), # inputs to our model are images, and the outputs are categories\n",
+        "    get_items=get_image_files, \n",
+        "    splitter=RandomSplitter(valid_pct=0.2, seed=42), # Split the data into training and validation sets randomly, using 20% of the data for the validation set\n",
+        "    get_y=parent_label, # The label is the name of each file's parent folder\n",
+        "    item_tfms=RandomResizedCrop(224, min_scale=0.3), # picks a randomly scaled crop of each image and resizes it to 224x224 pixels\n",
+        "    batch_tfms=aug_transforms() # applies augmentations to an entire batch\n",
+        ").dataloaders(path, bs=32)\n",
+        "\n",
+        "dls.show_batch()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "y-FNWY-3zEF3"
+      },
+      "source": [
+        "### Fine-tune a pretrained neural network to recognise these two groups"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "5ao0lw2cG2WP"
+      },
+      "outputs": [],
+      "source": [
+        "learn = vision_learner(dls, resnet34, metrics=error_rate)\n",
+        "learn.fine_tune(10)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "0wZAFpxi7L6z"
+      },
+      "source": [
+        "### Show the predictions the model made on images in the validation set"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "aE0vp3jeVtBT"
+      },
+      "outputs": [],
+      "source": [
+        "learn.show_results()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "gFpqdZr87ZSS"
+      },
+      "source": [
+        "### Download an image from the internet to try the model on"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "C0kfX6QUMRoN"
+      },
+      "outputs": [],
+      "source": [
+        "term='penguin' # change the search term\n",
+        "download_url(search_images(term, max_images=1)[0], 'test.jpg', show_progress=False)\n",
+        "Image.open('test.jpg').to_thumb(256,256)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "AgOQPzTX7q3o"
+      },
+      "source": [
+        "### Try the model on the downloaded image"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "sz1dVCZMHz3N"
+      },
+      "outputs": [],
+      "source": [
+        "predict,n,prob = learn.predict(PILImage.create('test.jpg'))\n",
+        "print(f\"It's {predict}!\")\n",
+        "perc = prob[n]*100\n",
+        "print(f\"I'm {perc:.02f}% confident.\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "lSSjWJq874WE"
+      },
+      "source": [
+        "### Export the model"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": 94,
+      "metadata": {
+        "id": "ae2bc6ac"
+      },
+      "outputs": [],
+      "source": [
+        "learn.export('model.pkl')"
+      ]
+    }
+  ],
+  "metadata": {
+    "accelerator": "GPU",
+    "colab": {
+      "collapsed_sections": [],
+      "name": "model.ipynb",
+      "provenance": []
+    },
+    "gpuClass": "standard",
+    "kernelspec": {
+      "display_name": "Python 3",
+      "name": "python3"
+    },
+    "language_info": {
+      "name": "python"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 0
+}

model.pkl CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:afbd4ed3363dd00b44ce149bf20e7d6891e96ca7280b1fa65e7ec4a0994cf115
-size 87468645

 version https://git-lfs.github.com/spec/v1
+oid sha256:8e13d90feb325569e3ac1ce4371ce77195222ac28f044a97b1620aef8f70efe2
+size 87503717