Support for Keras compatible classifiers (scikit-multilearn#138)

niedakh · web-flow · commit a7e3cbbf3149 · 2018-12-09T08:18:00.000+01:00
Implement a wrapper for the Keras scikit-learn-compatible wrapper.
diff --git a/.travis.yml b/.travis.yml
@@ -42,10 +42,16 @@ install:
 - if [[ "$TRAVIS_OS_NAME" != "osx" ]];   then docker run -e "MEKA_CLASSPATH=/opt/meka/lib/" -v "$TRAVIS_BUILD_DIR:/home/python-dev/repo" --name scikit_multilearn_dev_test_docker -d niedakh/scikit-multilearn-dev:latest; fi
 - if [[ "$TOXENV" == "linux_py2" ]]; then docker exec -it scikit_multilearn_dev_test_docker pip install -r /home/python-dev/repo/requirements-all.txt; fi
 - if [[ "$TOXENV" == "linux_py3" ]]; then docker exec -it scikit_multilearn_dev_test_docker pip3 install -r /home/python-dev/repo/requirements-all.txt; fi
+- if [[ "$TOXENV" == "linux_py2" ]]; then docker exec -it scikit_multilearn_dev_test_docker pip install -r /home/python-dev/repo/requirements/keras.txt; fi
+- if [[ "$TOXENV" == "linux_py3" ]]; then docker exec -it scikit_multilearn_dev_test_docker pip3 install -r /home/python-dev/repo/requirements/keras.txt; fi
 - if [[ "$TRAVIS_OS_NAME" != "osx" ]];   then find $TRAVIS_BUILD_DIR -name \*.pyc -delete; fi
 
 - if [[ "$TRAVIS_OS_NAME" == "osx" ]];   then cd $TRAVIS_BUILD_DIR && pip install -r requirements-all.txt ; fi
+- if [[ "$TRAVIS_OS_NAME" == "osx" ]];   then cd $TRAVIS_BUILD_DIR && pip install -r requirements/keras.txt; fi
 - if [[ "$TRAVIS_OS_NAME" == "osx" ]];   then cd $TRAVIS_BUILD_DIR && pip3 install -r requirements-all.txt; fi
+- if [[ "$TRAVIS_OS_NAME" == "osx" ]];   then cd $TRAVIS_BUILD_DIR && pip3 install https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-1.12.0-py3-none-any.whl; fi
+- if [[ "$TRAVIS_OS_NAME" == "osx" ]];   then cd $TRAVIS_BUILD_DIR && pip3 install -r requirements/keras.txt; fi
+
 notifications:
   slack:
     secure: aTCuexl+J0s+ll8sS+p65Atmr9hgOYg0Qkv1nOwb+2oVlJtIYpwLymYZdMymeMtcbK8nlCKGuZRj9jpowzLvSU5kmmmbUdCskEzLf8guE/TUN5iMcIdvKnlAxfJ/MBXw59bjIuF3saYmzpkYbaBvj150M/tXMkYMLSgqwFMQq6U=
diff --git a/appveyor.yml b/appveyor.yml
@@ -28,22 +28,26 @@ environment:
     - PYTHON: "C:\\Python27.10"
       PYTHON_VERSION: "2.7.10"
       PYTHON_ARCH: "32"
+      HAS_KERAS: "0"
 
     - PYTHON: "C:\\Python27.10-x64"
       PYTHON_VERSION: "2.7.10"
       PYTHON_ARCH: "64"
+      HAS_KERAS: "0"
 
     # Pre-installed Python versions, which Appveyor may upgrade to
     # a later point release.
     # See: http://www.appveyor.com/docs/installed-software#python
 
-    - PYTHON: "C:\\Python34"
-      PYTHON_VERSION: "3.4.x" # currently 3.4.3
+    - PYTHON: "C:\\Python35"
+      PYTHON_VERSION: "3.6.x" # point release is whichever Appveyor has pre-installed; NOTE(review): path above says Python35 - confirm
       PYTHON_ARCH: "32"
+      HAS_KERAS: "0"
 
-    - PYTHON: "C:\\Python34-x64"
-      PYTHON_VERSION: "3.4.x" # currently 3.4.3
+    - PYTHON: "C:\\Python36-x64"
+      PYTHON_VERSION: "3.6.x" # point release is whichever Appveyor has pre-installed
       PYTHON_ARCH: "64"
+      HAS_KERAS: "1"
 
 
 install:
@@ -90,6 +94,7 @@ install:
   # target Python version and architecture
   - "pip install -r requirements\\base.txt"
   - "pip install -r requirements\\meka.txt"
+  - ps: If ($env:HAS_KERAS -eq "1")  { & pip install -r requirements\\keras.txt }
   # - "pip install -r requirements\\gpl.txt"
   - "pip install -r requirements\\test.txt"
 
diff --git a/docs/source/index.rst b/docs/source/index.rst
@@ -29,7 +29,7 @@
 
     <div class="section">
       <div class="row">
-        <div class="col feature s12 m12 l6">
+        <div class="col feature s12 m6 l4">
           <div class="card  blue-grey darken-3">
             <div class="card-content white-text">
               <span class="card-title"><i class="fas fa-brain"></i> Lots of classifiers</span>
@@ -42,7 +42,7 @@
           </div>
         </div>
 
-        <div class="col feature s12 m6 l6">
+        <div class="col feature s12 m6 l4">
           <div class="card  blue-grey lighten-5">
             <div class="card-content black-text">
               <span class="card-title"><i class="fab fa-connectdevelop"></i> Label Relations</span>
@@ -107,14 +107,28 @@
             <div class="card-content white-text">
               <span class="card-title"><i class="fas fa-box-open"></i> MEKA wrapper</span>
               <p>Missing a particular classifier which exists in the Java MEKA and WEKA stack?
-              Now you can use it like a native scikit classifier!.</p>
+              Now you can use it like a native scikit classifier!</p>
             </div>
             <div class="card-action right-align">
               <a href="meka.html" class="waves-effect waves-light btn">Using MEKA</a>
             </div>
           </div>
         </div>
 
+
+        <div class="col feature s12 m6 l4">
+          <div class="card  blue-grey lighten-5">
+            <div class="card-content black-text">
+              <span class="card-title"><b>K</b> Keras support</span>
+              <p>Need a particular deep learning single/multi class classifier? You can now use it for multi-label
+              problems with scikit-multilearn!</p>
+            </div>
+            <div class="card-action right-align">
+              <a href="keras.html" class="waves-effect waves-light btn">Using Keras</a>
+            </div>
+          </div>
+        </div>
+
         <div class="col feature s12 m6 l4">
           <div class="card  blue-grey lighten-5">
             <div class="card-content black-text">
diff --git a/docs/source/keras.ipynb b/docs/source/keras.ipynb
@@ -0,0 +1,260 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 103,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from skmultilearn.ext import Keras\n",
+    "from keras.models import Sequential\n",
+    "from keras.layers import Dense\n",
+    "import numpy\n",
+    "import sklearn.metrics as metrics\n",
+    "from skmultilearn.dataset import load_dataset"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "X_train, y_train, feature_names, label_names = load_dataset('emotions', 'train')\n",
+    "X_test, y_test, _, _ = load_dataset('emotions', 'test')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Single-class Keras classifier"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We train a two-layer neural network using Keras with TensorFlow as the backend (feel free to use others). The network is fairly simple: two ReLU layers of 12 and 8 units, finishing with a sigmoid activation, optimized via binary cross-entropy. This is a case from the [Keras example page](https://keras.io/scikit-learn-api/). Note that the model creation function must create a model that accepts an input dimension and outputs a relevant output dimension. The Keras wrapper from scikit-multilearn will pass the relevant dimensions upon fitting. "
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 105,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def create_model_single_class(input_dim, output_dim):\n",
+    "\t# create model\n",
+    "\tmodel = Sequential()\n",
+    "\tmodel.add(Dense(12, input_dim=input_dim, activation='relu'))\n",
+    "\tmodel.add(Dense(8, activation='relu'))\n",
+    "\tmodel.add(Dense(output_dim, activation='sigmoid'))\n",
+    "\t# Compile model\n",
+    "\tmodel.compile(loss='binary_crossentropy', optimizer='adam', metrics=['accuracy'])\n",
+    "\treturn model"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "Let's use it with a problem transformation method which converts multi-label classification problems to single-label single-class problems, e.g. Binary Relevance, which trains a classifier per label."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 123,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from skmultilearn.problem_transform import BinaryRelevance"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 126,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "clf = BinaryRelevance(classifier=Keras(create_model_single_class), require_dense=[True,True])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 127,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "BinaryRelevance(classifier=<__main__.Keras object at 0x7f4d0b040978>,\n",
+       "        require_dense=[True, True])"
+      ]
+     },
+     "execution_count": 127,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "clf.fit(X_train,y_train)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 130,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "y_pred = clf.predict(X_test)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 133,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "0.25495049504950495"
+      ]
+     },
+     "execution_count": 133,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "metrics.hamming_loss(y_test, y_pred)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Multi-class Keras classifier"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "We now train a multi-class neural network using Keras with TensorFlow as the backend (feel free to use others), optimized via categorical cross-entropy. This is a case from the [Keras multi-class tutorial](https://machinelearningmastery.com/multi-class-classification-tutorial-keras-deep-learning-library/). Note again that the model creation function must create a model that accepts an input dimension and outputs a relevant output dimension. The Keras wrapper from scikit-multilearn will pass the relevant dimensions upon fitting. We must also tell the Keras wrapper that this is a multi-class case. We use the Label Powerset multi-label to multi-class transformation approach, but this can also be used with all the advanced label space division methods available in scikit-multilearn."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 136,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from skmultilearn.problem_transform import LabelPowerset"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 137,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def create_model_multiclass(input_dim, output_dim):\n",
+    "\t# create model\n",
+    "\tmodel = Sequential()\n",
+    "\tmodel.add(Dense(8, input_dim=input_dim, activation='relu'))\n",
+    "\tmodel.add(Dense(output_dim, activation='softmax'))\n",
+    "\t# Compile model\n",
+    "\tmodel.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])\n",
+    "\treturn model"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 138,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "clf = LabelPowerset(classifier=Keras(create_model_multiclass, multi_class=True), require_dense=[True,True])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 139,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "LabelPowerset(classifier=<__main__.Keras object at 0x7f4d09229be0>,\n",
+       "       require_dense=[True, True])"
+      ]
+     },
+     "execution_count": 139,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "clf.fit(X_train,y_train)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 140,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "y_pred = clf.predict(X_test)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 142,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "0.22277227722772278"
+      ]
+     },
+     "execution_count": 142,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "metrics.accuracy_score(y_test, y_pred)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}
diff --git a/requirements/keras.txt b/requirements/keras.txt
@@ -0,0 +1,2 @@
+keras
+tensorflow
diff --git a/skmultilearn/ext/__init__.py b/skmultilearn/ext/__init__.py
@@ -10,11 +10,19 @@
 | :class:`~skmultilearn.ext.Meka`            | Wrapper for the Multilabel Extension to WEKA -                   |
 |                                            | `MEKA <http://meka.sf.net>`_ library                             |
 +--------------------------------------------+------------------------------------------------------------------+
+| :class:`~skmultilearn.ext.Keras`           | Wrapper for the Python Deep Learning library -                   |
+|                                            | `KERAS <https://keras.io/>`_                                     |
++--------------------------------------------+------------------------------------------------------------------+
 | :func:`~skmultilearn.ext.download_meka`    | Helper function for installing MEKA                              |
 +--------------------------------------------+------------------------------------------------------------------+
 
 """
 
+import sys, platform
 from .meka import Meka, download_meka
 
 __all__ = ["Meka", 'download_meka']
+
+if not (sys.version_info[0] == 2 or platform.architecture()[0]=='32bit'):
+    from .keras import Keras
+    __all__ += ['Keras']
diff --git a/skmultilearn/ext/keras.py b/skmultilearn/ext/keras.py
diff --git a/skmultilearn/ext/tests/test_keras.py b/skmultilearn/ext/tests/test_keras.py