.. DO NOT EDIT.
.. THIS FILE WAS AUTOMATICALLY GENERATED BY SPHINX-GALLERY.
.. TO MAKE CHANGES, EDIT THE SOURCE PYTHON FILE:
.. "auto_examples/plot_1_example_mrc.py"
.. LINE NUMBERS ARE GIVEN BELOW.

.. only:: html

    .. note::
        :class: sphx-glr-download-link-note

        :ref:`Go to the end <sphx_glr_download_auto_examples_plot_1_example_mrc.py>`
        to download the full example code

.. rst-class:: sphx-glr-example-title

.. _sphx_glr_auto_examples_plot_1_example_mrc.py:

.. _ex1:

Example: Use of MRC with different settings
===========================================

Example of using MRC on some of the common classification datasets with
different loss and feature mapping settings.

We load each dataset and use stratified 5-fold cross-validation to generate
the train and test partitions: on each iteration one fold is held out for
testing and the remaining folds are used for training. For every fold we
compute the classification error together with the upper and lower bounds
on the error, and we also record the mean training time.

Note that we set the parameter solver='subgrad', which means that the MRC
classifiers use a Nesterov subgradient approach to perform the
optimization. You can check a more elaborate example in :ref:`ex_comp`.

.. GENERATED FROM PYTHON SOURCE LINES 23-130

.. code-block:: default


    import time

    import numpy as np
    import pandas as pd
    from sklearn import preprocessing
    from sklearn.model_selection import StratifiedKFold

    from MRCpy import MRC
    # Import the datasets
    from MRCpy.datasets import *

    # Data sets
    loaders = [
        load_mammographic,
        load_haberman,
        load_indian_liver,
        load_diabetes,
        load_credit,
    ]
    dataName = ["mammographic", "haberman", "indian_liver", "diabetes", "credit"]


    def runMRC(phi, loss):
        results = pd.DataFrame()
        # We fix the random seed so that the stratified k-fold partitions
        # are the same across the different executions
        random_seed = 0

        # Iterate through each dataset and fit the MRC classifier.
        for j, load in enumerate(loaders):

            # Loading the dataset
            X, Y = load()
            r = len(np.unique(Y))
            n, d = X.shape

            clf = MRC(phi=phi, loss=loss, random_state=random_seed,
                      max_iters=5000, solver='subgrad')

            # Generate the partitions of the stratified cross-validation
            n_splits = 5
            cv = StratifiedKFold(
                n_splits=n_splits, random_state=random_seed, shuffle=True
            )

            cvError = list()
            auxTime = 0
            upper = 0
            lower = 0

            # Paired and stratified cross-validation
            for train_index, test_index in cv.split(X, Y):

                X_train, X_test = X[train_index], X[test_index]
                y_train, y_test = Y[train_index], Y[test_index]

                # Normalizing the data: fit the scaler on the training
                # split only and apply it to both splits
                std_scale = preprocessing.StandardScaler().fit(X_train)
                X_train = std_scale.transform(X_train)
                X_test = std_scale.transform(X_test)

                # Save start time for computing training time
                startTime = time.time()

                # Train the model and save the upper and lower bounds
                clf.fit(X_train, y_train)
                upper += clf.get_upper_bound()
                lower += clf.get_lower_bound()

                # Save the training time
                auxTime += time.time() - startTime

                # Predict the class for test instances
                y_pred = clf.predict(X_test)

                # Calculate the error made by the MRC classifier
                cvError.append(np.average(y_pred != y_test))

            res_mean = np.average(cvError)
            res_std = np.std(cvError)

            # Calculating the mean upper and lower bound and training time
            upper = upper / n_splits
            lower = lower / n_splits
            auxTime = auxTime / n_splits

            results = pd.concat(
                [
                    results,
                    pd.DataFrame([{
                        "dataset": dataName[j],
                        "n_samples": "%d" % n,
                        "n_attributes": "%d" % d,
                        "n_classes": "%d" % r,
                        "error": "%1.2g" % res_mean
                        + " +/- "
                        + "%1.2g" % res_std,
                        "upper": "%1.2g" % upper,
                        "lower": "%1.2g" % lower,
                        "avg_train_time (s)": "%1.2g" % auxTime,
                    }]),
                ],
                ignore_index=True,
            )

        return results

.. GENERATED FROM PYTHON SOURCE LINES 131-135

.. code-block:: default


    r1 = runMRC(phi="fourier", loss="0-1")
    r1.style.set_caption("Using 0-1 loss and fourier feature mapping")

.. raw:: html

    <table>
      <caption>Using 0-1 loss and fourier feature mapping</caption>
      <thead>
        <tr>
          <th></th>
          <th>dataset</th>
          <th>n_samples</th>
          <th>n_attributes</th>
          <th>n_classes</th>
          <th>error</th>
          <th>upper</th>
          <th>lower</th>
          <th>avg_train_time (s)</th>
        </tr>
      </thead>
      <tbody>
        <tr><td>0</td><td>mammographic</td><td>961</td><td>5</td><td>2</td><td>0.18 +/- 0.013</td><td>0.23</td><td>0.21</td><td>0.69</td></tr>
        <tr><td>1</td><td>haberman</td><td>306</td><td>3</td><td>2</td><td>0.27 +/- 0.016</td><td>0.26</td><td>0.24</td><td>0.45</td></tr>
        <tr><td>2</td><td>indian_liver</td><td>583</td><td>10</td><td>2</td><td>0.29 +/- 0.0035</td><td>0.29</td><td>0.28</td><td>0.64</td></tr>
        <tr><td>3</td><td>diabetes</td><td>768</td><td>8</td><td>2</td><td>0.25 +/- 0.03</td><td>0.29</td><td>0.25</td><td>0.76</td></tr>
        <tr><td>4</td><td>credit</td><td>690</td><td>15</td><td>2</td><td>0.14 +/- 0.034</td><td>0.2</td><td>0.15</td><td>0.95</td></tr>
      </tbody>
    </table>


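The "error" column above is the mean 0-1 error over the five folds,
plus/minus its standard deviation, formatted with ``"%1.2g"`` exactly as in
``runMRC``. A minimal sketch of that aggregation, using made-up per-fold
predictions rather than the real datasets:

```python
import numpy as np

# Hypothetical (y_test, y_pred) pairs for two folds; these stand in for
# the per-fold outputs of clf.predict in the example above.
folds = [
    (np.array([0, 1, 1, 0, 1]), np.array([0, 1, 0, 0, 1])),
    (np.array([1, 0, 1, 1, 0]), np.array([1, 0, 1, 0, 0])),
]

cvError = []
for y_test, y_pred in folds:
    # 0-1 error: fraction of misclassified test instances in this fold
    cvError.append(np.average(y_pred != y_test))

res_mean = np.average(cvError)
res_std = np.std(cvError)
print("%1.2g" % res_mean + " +/- " + "%1.2g" % res_std)  # prints "0.2 +/- 0"
```

Each fold above misclassifies one instance out of five, so the mean error
is 0.2 with zero spread.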
.. GENERATED FROM PYTHON SOURCE LINES 136-139

.. code-block:: default


    r2 = runMRC(phi="fourier", loss="log")
    r2.style.set_caption("Using log loss and fourier feature mapping")

.. raw:: html

    <table>
      <caption>Using log loss and fourier feature mapping</caption>
      <thead>
        <tr>
          <th></th>
          <th>dataset</th>
          <th>n_samples</th>
          <th>n_attributes</th>
          <th>n_classes</th>
          <th>error</th>
          <th>upper</th>
          <th>lower</th>
          <th>avg_train_time (s)</th>
        </tr>
      </thead>
      <tbody>
        <tr><td>0</td><td>mammographic</td><td>961</td><td>5</td><td>2</td><td>0.18 +/- 0.011</td><td>0.54</td><td>0.44</td><td>2.3</td></tr>
        <tr><td>1</td><td>haberman</td><td>306</td><td>3</td><td>2</td><td>0.27 +/- 0.016</td><td>0.58</td><td>0.5</td><td>1.1</td></tr>
        <tr><td>2</td><td>indian_liver</td><td>583</td><td>10</td><td>2</td><td>0.29 +/- 0.0035</td><td>0.6</td><td>0.59</td><td>1.8</td></tr>
        <tr><td>3</td><td>diabetes</td><td>768</td><td>8</td><td>2</td><td>0.24 +/- 0.027</td><td>0.6</td><td>0.52</td><td>2.7</td></tr>
        <tr><td>4</td><td>credit</td><td>690</td><td>15</td><td>2</td><td>0.14 +/- 0.034</td><td>0.5</td><td>0.39</td><td>2.5</td></tr>
      </tbody>
    </table>


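The per-fold normalization in the code above fits the ``StandardScaler`` on
the training split only and then transforms both splits, so no test-set
statistics leak into training. The same pattern can be sketched in plain
NumPy, with synthetic data standing in for the real folds:

```python
import numpy as np

rng = np.random.default_rng(0)
X_train = rng.normal(loc=3.0, scale=2.0, size=(100, 4))
X_test = rng.normal(loc=3.0, scale=2.0, size=(20, 4))

# Estimate mean and standard deviation from the training split ONLY:
# the test split must not influence these statistics.
mu = X_train.mean(axis=0)
sigma = X_train.std(axis=0)

# Apply the same transformation to both splits.
X_train_std = (X_train - mu) / sigma
X_test_std = (X_test - mu) / sigma

# The training split is exactly standardized; the test split is only
# approximately so, which is expected.
print(np.allclose(X_train_std.mean(axis=0), 0.0))  # prints "True"
```

This mirrors ``preprocessing.StandardScaler().fit(X_train)`` followed by
``transform`` on each split.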
.. rst-class:: sphx-glr-timing

   **Total running time of the script:** ( 1 minutes 10.256 seconds)


.. _sphx_glr_download_auto_examples_plot_1_example_mrc.py:

.. only:: html

  .. container:: sphx-glr-footer sphx-glr-footer-example

    .. container:: sphx-glr-download sphx-glr-download-python

      :download:`Download Python source code: plot_1_example_mrc.py <plot_1_example_mrc.py>`

    .. container:: sphx-glr-download sphx-glr-download-jupyter

      :download:`Download Jupyter notebook: plot_1_example_mrc.ipynb <plot_1_example_mrc.ipynb>`

.. only:: html

 .. rst-class:: sphx-glr-signature

    `Gallery generated by Sphinx-Gallery <https://sphinx-gallery.github.io>`_