From 752871dd0cff14aecb1266848bd81f01cde38975 Mon Sep 17 00:00:00 2001
From: olasaadi <92303887+olasaadi@users.noreply.github.com>
Date: Wed, 23 Feb 2022 14:57:12 +0200
Subject: [PATCH 01/26] add minimization notebook (#22)

* add german credit notebook to showcase new features (minimize only some features and categorical features)

* add notebook to show minimization data on a regression problem
---
 notebooks/minimization_diabetes_reg.ipynb  | 262 ++++++++++++++
 notebooks/minimization_german_credit.ipynb | 385 +++++++++++++++++++++
 tests/test_minimizer.py                    |   2 +-
 3 files changed, 648 insertions(+), 1 deletion(-)
 create mode 100644 notebooks/minimization_diabetes_reg.ipynb
 create mode 100644 notebooks/minimization_german_credit.ipynb

diff --git a/notebooks/minimization_diabetes_reg.ipynb b/notebooks/minimization_diabetes_reg.ipynb
new file mode 100644
index 0000000..597d77a
--- /dev/null
+++ b/notebooks/minimization_diabetes_reg.ipynb
@@ -0,0 +1,262 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "collapsed": true,
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   },
+   "source": [
+    "# Applying data minimization to a trained regression ML model"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "In this tutorial we will show how to perform data minimization for regression ML models using the minimization module.\n",
+    "\n",
+    "We will show how to apply data minimization to several different trained regression models."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Load data\n",
+    "The `QI` list (passed below as `features_to_minimize`) determines which features will be minimized."
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 54,
+   "outputs": [],
+   "source": [
+    "from sklearn.datasets import load_diabetes\n",
+    "from sklearn.model_selection import train_test_split\n",
+    "\n",
+    "dataset = load_diabetes()\n",
+    "X_train, X_test, y_train, y_test = train_test_split(dataset.data, dataset.target, test_size=0.5, random_state=14)\n",
+    "\n",
+    "features = ['age', 'sex', 'bmi', 'bp',\n",
+    "                's1', 's2', 's3', 's4', 's5', 's6']\n",
+    "QI = [0, 2, 5, 8, 9]"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Train DecisionTreeRegressor model"
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 55,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Base model accuracy (R2 score):  0.15014421352446072\n"
+     ]
+    }
+   ],
+   "source": [
+    "from apt.minimization import GeneralizeToRepresentative\n",
+    "from sklearn.tree import DecisionTreeRegressor\n",
+    "\n",
+    "model1 = DecisionTreeRegressor(random_state=10, min_samples_split=2)\n",
+    "model1.fit(X_train, y_train)\n",
+    "print('Base model accuracy (R2 score): ', model1.score(X_test, y_test))"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Run minimization\n",
+    "We will try to run minimization with only a subset of the features."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 56,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.108922\n",
+      "Improving accuracy\n",
+      "feature to remove: s5\n",
+      "Removed feature: s5, new relative accuracy: 0.505498\n",
+      "feature to remove: s6\n",
+      "Removed feature: s6, new relative accuracy: 0.404757\n",
+      "feature to remove: bmi\n",
+      "Removed feature: bmi, new relative accuracy: 0.718978\n",
+      "Accuracy on minimized data:  0.11604533946025941\n",
+      "generalizations:  {'ranges': {'age': [-0.07090024650096893, -0.043656209483742714, -0.041839939542114735, -0.03639113181270659, -0.01459590089507401, -0.012779632292222232, -0.009147093165665865, -0.0036982858437113464, 0.03989217430353165, 0.039892176166176796, 0.05623859912157059, 0.06713621318340302], 's2': [-0.0550188384950161, -0.0285577941685915, -0.024643437936902046, -0.02135537937283516, -0.013683241792023182, -0.006480826530605555, 0.009176596067845821, 0.023111702874302864, 0.02420772146433592, 0.02655633445829153, 0.039082273840904236]}, 'categories': {}, 'untouched': ['s3', 'bmi', 's6', 'bp', 's4', 's5', 'sex', 's1']}\n"
+     ]
+    }
+   ],
+   "source": [
+    "# note that is_regression param is True\n",
+    "\n",
+    "minimizer1 = GeneralizeToRepresentative(model1, target_accuracy=0.7, features=features, is_regression=True,\n",
+    "                                    features_to_minimize=QI)\n",
+    "\n",
+    "# Fitting the minimizer can be done either on training or test data. Doing it with test data is better as the\n",
+    "# resulting accuracy on test data will be closer to the desired target accuracy (when working with training\n",
+    "# data it could result in a larger gap)\n",
+    "# Don't forget to leave a hold-out set for final validation!\n",
+    "X_generalizer_train1, x_test1, y_generalizer_train1, y_test1 = train_test_split(X_test, y_test,\n",
+    "                                                                test_size = 0.4, random_state = 38)\n",
+    "\n",
+    "x_train_predictions1 = model1.predict(X_generalizer_train1)\n",
+    "minimizer1.fit(X_generalizer_train1, x_train_predictions1)\n",
+    "transformed1 = minimizer1.transform(x_test1)\n",
+    "print('Accuracy on minimized data: ', model1.score(transformed1, y_test1))\n",
+    "print('generalizations: ',minimizer1.generalizations_)"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Train linear regression model"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%% md\n"
+    }
+   }
+  },
+  {
+   "cell_type": "code",
+   "source": [
+    "from sklearn.linear_model import LinearRegression\n",
+    "from apt.minimization import GeneralizeToRepresentative\n",
+    "\n",
+    "model2 = LinearRegression()\n",
+    "model2.fit(X_train, y_train)\n",
+    "print('Base model accuracy (R2 score): ', model2.score(X_test, y_test))"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
+   "execution_count": null,
+   "outputs": []
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Run minimization\n",
+    "We will try to run minimization with only a subset of the features."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 58,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.225782\n",
+      "Improving accuracy\n",
+      "feature to remove: age\n",
+      "Removed feature: age, new relative accuracy: 0.223565\n",
+      "feature to remove: s2\n",
+      "Removed feature: s2, new relative accuracy: 0.759788\n",
+      "Accuracy on minimized data:  0.4414329261774286\n",
+      "generalizations:  {'ranges': {'bmi': [-0.0660245232284069, -0.06171327643096447, -0.048779530450701714, -0.036923596635460854, -0.022912041284143925, -0.015906263142824173, -0.009978296235203743, 0.007266696775332093, 0.022356065921485424, 0.028822937980294228, 0.04499012045562267, 0.053073709830641747, 0.10103634744882584], 's5': [-0.08940735459327698, -0.07823517918586731, -0.07310866191983223, -0.07022909820079803, -0.06740894541144371, -0.06558558344841003, -0.041897499933838844, -0.04049498960375786, -0.03781316243112087, -0.033939776942133904, -0.03263746201992035, -0.02538660168647766, -0.023219254799187183, -0.017585186287760735, -0.016525186598300934, -0.008522996446117759, 0.0015758189256303012, 0.012934560421854258, 0.014069339726120234, 0.015929921995848417, 0.01947084255516529, 0.028651678003370762, 0.03358383011072874, 0.03639278281480074, 0.041416410356760025, 0.06386702693998814], 's6': [-0.07356456853449345, -0.052854035049676895, -0.048711927607655525, -0.0383566590026021, -0.02800139266764745, -0.021788232028484344, -0.007290858076885343, -0.007290857844054699, 0.017561784014105797, 0.02377494378015399, 0.02791705122217536, 0.02998810407007113, 0.054840744473040104]}, 'categories': {}, 'untouched': ['s2', 's3', 'bp', 's4', 'age', 'sex', 's1']}\n"
+     ]
+    }
+   ],
+   "source": [
+    "# note that is_regression param is True\n",
+    "\n",
+    "minimizer2 = GeneralizeToRepresentative(model2, target_accuracy=0.7, features=features, is_regression=True,\n",
+    "                                    features_to_minimize=QI)\n",
+    "\n",
+    "# Fitting the minimizer can be done either on training or test data. Doing it with test data is better as the\n",
+    "# resulting accuracy on test data will be closer to the desired target accuracy (when working with training\n",
+    "# data it could result in a larger gap)\n",
+    "# Don't forget to leave a hold-out set for final validation!\n",
+    "X_generalizer_train2, x_test2, y_generalizer_train2, y_test2 = train_test_split(X_test, y_test,\n",
+    "                                                                test_size = 0.4, random_state = 38)\n",
+    "\n",
+    "x_train_predictions2 = model2.predict(X_generalizer_train2)\n",
+    "minimizer2.fit(X_generalizer_train2, x_train_predictions2)\n",
+    "transformed2 = minimizer2.transform(x_test2)\n",
+    "print('Accuracy on minimized data: ', model2.score(transformed2, y_test2))\n",
+    "print('generalizations: ',minimizer2.generalizations_)"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 2
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython2",
+   "version": "2.7.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 0
+}
\ No newline at end of file
diff --git a/notebooks/minimization_german_credit.ipynb b/notebooks/minimization_german_credit.ipynb
new file mode 100644
index 0000000..03af5f0
--- /dev/null
+++ b/notebooks/minimization_german_credit.ipynb
@@ -0,0 +1,385 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "source": [
+    "# Applying data minimization with categorical data and only a subset of the features to a trained ML model"
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "In this tutorial we will show how to perform data minimization for ML models using the minimization module.\n",
+    "\n",
+    "This will be demonstrated using the German Credit dataset (original dataset can be found here: https://archive.ics.uci.edu/ml/machine-learning-databases/statlog/german/german.data)."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Load data\n",
+    "The `QI` list (passed below as `features_to_minimize`) determines which features will be minimized."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "    Existing_checking_account  Duration_in_month Credit_history Purpose  \\\n",
+      "0                         A14                 24            A32     A41   \n",
+      "1                         A14                 33            A33     A49   \n",
+      "2                         A11                  9            A32     A42   \n",
+      "3                         A14                 28            A34     A43   \n",
+      "4                         A11                 24            A33     A43   \n",
+      "..                        ...                ...            ...     ...   \n",
+      "695                       A14                 12            A32     A43   \n",
+      "696                       A14                 13            A32     A43   \n",
+      "697                       A11                 48            A30     A41   \n",
+      "698                       A12                 21            A34     A42   \n",
+      "699                       A13                 15            A32     A46   \n",
+      "\n",
+      "     Credit_amount Savings_account Present_employment_since  Installment_rate  \\\n",
+      "0             7814             A61                      A74                 3   \n",
+      "1             2764             A61                      A73                 2   \n",
+      "2             2136             A61                      A73                 3   \n",
+      "3             2743             A61                      A75                 4   \n",
+      "4             1659             A61                      A72                 4   \n",
+      "..             ...             ...                      ...               ...   \n",
+      "695           1963             A61                      A74                 4   \n",
+      "696           1409             A62                      A71                 2   \n",
+      "697           4605             A61                      A75                 3   \n",
+      "698           2745             A64                      A74                 3   \n",
+      "699           1905             A61                      A75                 4   \n",
+      "\n",
+      "    Personal_status_sex debtors  Present_residence Property  Age  \\\n",
+      "0                   A93    A101                  3     A123   38   \n",
+      "1                   A92    A101                  2     A123   26   \n",
+      "2                   A93    A101                  2     A121   25   \n",
+      "3                   A93    A101                  2     A123   29   \n",
+      "4                   A92    A101                  2     A123   29   \n",
+      "..                  ...     ...                ...      ...  ...   \n",
+      "695                 A93    A101                  2     A123   31   \n",
+      "696                 A92    A101                  4     A121   64   \n",
+      "697                 A93    A101                  4     A124   24   \n",
+      "698                 A93    A101                  2     A123   32   \n",
+      "699                 A93    A101                  4     A123   40   \n",
+      "\n",
+      "    Other_installment_plans Housing  Number_of_existing_credits   Job  \\\n",
+      "0                      A143    A152                           1  A174   \n",
+      "1                      A143    A152                           2  A173   \n",
+      "2                      A143    A152                           1  A173   \n",
+      "3                      A143    A152                           2  A173   \n",
+      "4                      A143    A151                           1  A172   \n",
+      "..                      ...     ...                         ...   ...   \n",
+      "695                    A143    A151                           2  A174   \n",
+      "696                    A143    A152                           1  A173   \n",
+      "697                    A143    A153                           2  A173   \n",
+      "698                    A143    A152                           2  A173   \n",
+      "699                    A143    A151                           1  A174   \n",
+      "\n",
+      "     N_people_being_liable_provide_maintenance  Telephone  Foreign_worker  \n",
+      "0                                            1          1               1  \n",
+      "1                                            1          1               1  \n",
+      "2                                            1          0               1  \n",
+      "3                                            1          0               1  \n",
+      "4                                            1          1               1  \n",
+      "..                                         ...        ...             ...  \n",
+      "695                                          2          1               1  \n",
+      "696                                          1          0               1  \n",
+      "697                                          2          0               1  \n",
+      "698                                          1          1               1  \n",
+      "699                                          1          1               1  \n",
+      "\n",
+      "[700 rows x 20 columns]\n"
+     ]
+    }
+   ],
+   "source": [
+    "from apt.utils import get_german_credit_dataset\n",
+    "\n",
+    "(x_train, y_train), (x_test, y_test) = get_german_credit_dataset()\n",
+    "features = [\"Existing_checking_account\", \"Duration_in_month\", \"Credit_history\", \"Purpose\", \"Credit_amount\",\n",
+    "                \"Savings_account\", \"Present_employment_since\", \"Installment_rate\", \"Personal_status_sex\", \"debtors\",\n",
+    "                \"Present_residence\", \"Property\", \"Age\", \"Other_installment_plans\", \"Housing\",\n",
+    "                \"Number_of_existing_credits\", \"Job\", \"N_people_being_liable_provide_maintenance\", \"Telephone\",\n",
+    "                \"Foreign_worker\"]\n",
+    "categorical_features = [\"Existing_checking_account\", \"Credit_history\", \"Purpose\", \"Savings_account\",\n",
+    "                        \"Present_employment_since\", \"Personal_status_sex\", \"debtors\", \"Property\",\n",
+    "                        \"Other_installment_plans\", \"Housing\", \"Job\"]\n",
+    "QI = [\"Duration_in_month\", \"Credit_history\", \"Purpose\", \"debtors\", \"Property\", \"Other_installment_plans\",\n",
+    "      \"Housing\", \"Job\"]\n",
+    "\n",
+    "print(x_train)"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Train decision tree model\n",
+    "We use OneHotEncoder to handle categorical features."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Base model accuracy:  0.7033333333333334\n"
+     ]
+    }
+   ],
+   "source": [
+    "from sklearn.compose import ColumnTransformer\n",
+    "from sklearn.preprocessing import OneHotEncoder\n",
+    "from sklearn.impute import SimpleImputer\n",
+    "from sklearn.pipeline import Pipeline\n",
+    "from sklearn.tree import DecisionTreeClassifier\n",
+    "numeric_features = [f for f in features if f not in categorical_features]\n",
+    "numeric_transformer = Pipeline(\n",
+    "    steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]\n",
+    ")\n",
+    "categorical_transformer = OneHotEncoder(handle_unknown=\"ignore\", sparse=False)\n",
+    "preprocessor = ColumnTransformer(\n",
+    "    transformers=[\n",
+    "        (\"num\", numeric_transformer, numeric_features),\n",
+    "        (\"cat\", categorical_transformer, categorical_features),\n",
+    "    ]\n",
+    ")\n",
+    "encoded_train = preprocessor.fit_transform(x_train)\n",
+    "model = DecisionTreeClassifier()\n",
+    "model.fit(encoded_train, y_train)\n",
+    "\n",
+    "encoded_test = preprocessor.transform(x_test)\n",
+    "print('Base model accuracy: ', model.score(encoded_test, y_test))"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "## Run minimization\n",
+    "We will try to run minimization with categorical features and only a subset of the features with different possible values of target accuracy (how close to the original model's accuracy we want to get, 1 being same accuracy as for original data)."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.791667\n",
+      "Improving accuracy\n",
+      "feature to remove: Property\n",
+      "Removed feature: Property, new relative accuracy: 0.819444\n",
+      "feature to remove: Other_installment_plans\n",
+      "Removed feature: Other_installment_plans, new relative accuracy: 0.833333\n",
+      "feature to remove: Job\n",
+      "Removed feature: Job, new relative accuracy: 0.833333\n",
+      "feature to remove: Housing\n",
+      "Removed feature: Housing, new relative accuracy: 0.833333\n",
+      "feature to remove: Purpose\n",
+      "Removed feature: Purpose, new relative accuracy: 0.916667\n",
+      "feature to remove: Credit_history\n",
+      "Removed feature: Credit_history, new relative accuracy: 0.930556\n",
+      "feature to remove: debtors\n",
+      "Removed feature: debtors, new relative accuracy: 0.944444\n",
+      "feature to remove: Duration_in_month\n",
+      "Removed feature: Duration_in_month, new relative accuracy: 1.000000\n",
+      "Accuracy on minimized data:  0.6666666666666666\n"
+     ]
+    }
+   ],
+   "source": [
+    "import sys\n",
+    "import os\n",
+    "sys.path.insert(0, os.path.abspath('..'))\n",
+    "\n",
+    "from apt.minimization import GeneralizeToRepresentative\n",
+    "from sklearn.model_selection import train_test_split\n",
+    "\n",
+    "# default target_accuracy is 0.998\n",
+    "minimizer = GeneralizeToRepresentative(model, features=features,\n",
+    "                                     categorical_features=categorical_features, features_to_minimize=QI)\n",
+    "\n",
+    "# Fitting the minimizer can be done either on training or test data. Doing it with test data is better as the\n",
+    "# resulting accuracy on test data will be closer to the desired target accuracy (when working with training\n",
+    "# data it could result in a larger gap)\n",
+    "# Don't forget to leave a hold-out set for final validation!\n",
+    "X_generalizer_train, x_test, y_generalizer_train, y_test = train_test_split(x_test, y_test, stratify=y_test,\n",
+    "                                                                test_size = 0.4, random_state = 38)\n",
+    "X_generalizer_train.reset_index(drop=True, inplace=True)\n",
+    "y_generalizer_train.reset_index(drop=True, inplace=True)\n",
+    "x_test.reset_index(drop=True, inplace=True)\n",
+    "y_test.reset_index(drop=True, inplace=True)\n",
+    "encoded_generalizer_train = preprocessor.transform(X_generalizer_train)\n",
+    "x_train_predictions = model.predict(encoded_generalizer_train)\n",
+    "minimizer.fit(X_generalizer_train, x_train_predictions)\n",
+    "transformed = minimizer.transform(x_test)\n",
+    "\n",
+    "encoded_transformed = preprocessor.transform(transformed)\n",
+    "print('Accuracy on minimized data: ', model.score(encoded_transformed, y_test))"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "#### Let's see what features were generalized"
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "{'ranges': {}, 'categories': {}, 'untouched': ['Purpose', 'Present_residence', 'Credit_history', 'Telephone', 'Job', 'Housing', 'Installment_rate', 'Number_of_existing_credits', 'Foreign_worker', 'Existing_checking_account', 'Other_installment_plans', 'N_people_being_liable_provide_maintenance', 'Property', 'Savings_account', 'Present_employment_since', 'Personal_status_sex', 'Duration_in_month', 'debtors', 'Credit_amount', 'Age']}\n"
+     ]
+    }
+   ],
+   "source": [
+    "generalizations = minimizer.generalizations\n",
+    "print(generalizations)"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "We can see that for the default target accuracy of 0.998 of the original accuracy, no generalizations are possible (all features are left untouched, i.e., not generalized).\n",
+    "\n",
+    "Let's change to a slightly lower target accuracy."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.791667\n",
+      "Improving accuracy\n",
+      "feature to remove: Property\n",
+      "Removed feature: Property, new relative accuracy: 0.819444\n",
+      "feature to remove: Other_installment_plans\n",
+      "Removed feature: Other_installment_plans, new relative accuracy: 0.833333\n",
+      "feature to remove: Job\n",
+      "Removed feature: Job, new relative accuracy: 0.833333\n",
+      "feature to remove: Housing\n",
+      "Removed feature: Housing, new relative accuracy: 0.833333\n",
+      "feature to remove: Purpose\n",
+      "Removed feature: Purpose, new relative accuracy: 0.916667\n",
+      "feature to remove: Credit_history\n",
+      "Removed feature: Credit_history, new relative accuracy: 0.930556\n",
+      "Accuracy on minimized data:  0.6416666666666667\n",
+      "{'ranges': {'Duration_in_month': [7.0, 8.5, 11.0, 13.0, 14.0, 18.0, 23.0, 25.5, 34.5, 47.5]}, 'categories': {'debtors': [['A101', 'A102'], ['A103']]}, 'untouched': ['Existing_checking_account', 'Savings_account', 'Present_employment_since', 'Property', 'Housing', 'Purpose', 'Personal_status_sex', 'Present_residence', 'Credit_history', 'Telephone', 'Installment_rate', 'Other_installment_plans', 'Number_of_existing_credits', 'Credit_amount', 'N_people_being_liable_provide_maintenance', 'Foreign_worker', 'Age', 'Job']}\n"
+     ]
+    }
+   ],
+   "source": [
+    "# We allow an 8% deviation in accuracy from the original model accuracy (target_accuracy=0.92)\n",
+    "minimizer2 = GeneralizeToRepresentative(model, target_accuracy=0.92, features=features,\n",
+    "                                     categorical_features=categorical_features, features_to_minimize=QI)\n",
+    "\n",
+    "minimizer2.fit(X_generalizer_train, x_train_predictions)\n",
+    "transformed2 = minimizer2.transform(x_test)\n",
+    "\n",
+    "encoded_transformed2 = preprocessor.transform(transformed2)\n",
+    "print('Accuracy on minimized data: ', model.score(encoded_transformed2, y_test))\n",
+    "generalizations2 = minimizer2.generalizations\n",
+    "print(generalizations2)"
+   ],
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "This time we were able to generalize two features (Duration_in_month and debtors)."
+   ],
+   "metadata": {
+    "collapsed": false
+   }
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 2
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython2",
+   "version": "2.7.6"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 0
+}
\ No newline at end of file
diff --git a/tests/test_minimizer.py b/tests/test_minimizer.py
index 3ed7fa6..e6f50be 100644
--- a/tests/test_minimizer.py
+++ b/tests/test_minimizer.py
@@ -510,7 +510,7 @@ def test_regression():
     transformed = gen.transform(x_train)
     print('Base model accuracy (R2 score): ', model.score(x_test, y_test))
     model.fit(transformed, y_train)
-    print('Base model accuracy (R2 score) after anonymization: ', model.score(x_test, y_test))
+    print('Base model accuracy (R2 score) after minimization: ', model.score(x_test, y_test))
     gener = gen.generalizations_
     expexted_generalizations = {'ranges': {
         'age': [-0.07816532626748085, -0.07090024650096893, -0.05637009255588055, -0.05092128552496433,

From 7fbd1e4b904909d8440414f81de49e51e640be2d Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Wed, 23 Feb 2022 19:22:54 +0200
Subject: [PATCH 02/26] Update version and docs

---
 apt/__init__.py              |  2 +-
 apt/minimization/__init__.py |  3 ---
 docs/conf.py                 |  2 +-
 docs/source/tests.rst        | 30 ------------------------------
 setup.cfg                    |  2 +-
 5 files changed, 3 insertions(+), 36 deletions(-)
 delete mode 100644 docs/source/tests.rst

diff --git a/apt/__init__.py b/apt/__init__.py
index 99e5ad6..ea6178a 100644
--- a/apt/__init__.py
+++ b/apt/__init__.py
@@ -6,4 +6,4 @@ from apt import anonymization
 from apt import minimization
 from apt import utils
 
-__version__ = "0.0.3"
\ No newline at end of file
+__version__ = "0.0.4"
\ No newline at end of file
diff --git a/apt/minimization/__init__.py b/apt/minimization/__init__.py
index e9aa35d..10d0a57 100644
--- a/apt/minimization/__init__.py
+++ b/apt/minimization/__init__.py
@@ -12,8 +12,5 @@ them to new data.
 
 It is also possible to export the generalizations as feature ranges.
 
-The current implementation supports only numeric features, so any categorical features must be transformed to a numeric
-representation before using this class.
-
 """
 from apt.minimization.minimizer import GeneralizeToRepresentative
diff --git a/docs/conf.py b/docs/conf.py
index 0b26b58..36cdd76 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -22,7 +22,7 @@ copyright = '2021, IBM'
 author = 'Abigail Goldsteen'
 
 # The full version, including alpha/beta/rc tags
-release = '0.0.3'
+release = '0.0.4'
 
 master_doc = 'index'
 
diff --git a/docs/source/tests.rst b/docs/source/tests.rst
deleted file mode 100644
index b1428e0..0000000
--- a/docs/source/tests.rst
+++ /dev/null
@@ -1,30 +0,0 @@
-tests package
-=============
-
-Submodules
-----------
-
-tests.test\_anonymizer module
------------------------------
-
-.. automodule:: tests.test_anonymizer
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-tests.test\_minimizer module
-----------------------------
-
-.. automodule:: tests.test_minimizer
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
-
-Module contents
----------------
-
-.. automodule:: tests
-    :members:
-    :undoc-members:
-    :show-inheritance:
diff --git a/setup.cfg b/setup.cfg
index f82cdb6..2e79a5f 100644
--- a/setup.cfg
+++ b/setup.cfg
@@ -1,7 +1,7 @@
 [metadata]
 # replace with your username:
 name = ai-privacy-toolkit
-version = 0.0.3
+version = 0.0.4
 author = Abigail Goldsteen
 author_email = abigailt@il.ibm.com
 description = A toolkit for tools and techniques related to the privacy and compliance of AI models.

From c47819a0316418b186c2a2a88121e60b5f6298f6 Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Wed, 23 Feb 2022 19:40:11 +0200
Subject: [PATCH 03/26] Update docs

---
 apt/anonymization/anonymizer.py | 24 +++++++++++++++---------
 apt/minimization/minimizer.py   |  5 +++--
 apt/utils.py                    |  5 +++--
 3 files changed, 21 insertions(+), 13 deletions(-)

diff --git a/apt/anonymization/anonymizer.py b/apt/anonymization/anonymizer.py
index d7b1c88..c3bbdb9 100644
--- a/apt/anonymization/anonymizer.py
+++ b/apt/anonymization/anonymizer.py
@@ -14,19 +14,25 @@ class Anonymize:
     Class for performing tailored, model-guided anonymization of training datasets for ML models.
 
     Based on the implementation described in: https://arxiv.org/abs/2007.13086
+
+    Parameters
+    ----------
+    k : int
+        The privacy parameter that determines the number of records that will be indistinguishable from each
+        other (when looking at the quasi identifiers). Should be at least 2.
+    quasi_identifiers : np.ndarray or list
+        The features that need to be minimized in case of pandas data, and indexes of features
+        in case of numpy data.
+    categorical_features : list, optional
+        The list of categorical features (should only be supplied when passing data as a
+        pandas dataframe).
+    is_regression : Bool, optional
+        Whether the model is a regression model or not (if False, assumes
+        a classification model). Default is False.
     """
 
     def __init__(self, k: int, quasi_identifiers: Union[np.ndarray, list], categorical_features: Optional[list] = None,
                  is_regression=False):
-        """
-        :param k: The privacy parameter that determines the number of records that will be indistinguishable from each
-                  other (when looking at the quasi identifiers). Should be at least 2.
-        :param quasi_identifiers: The features that need to be minimized in case of pandas data, and indexes of features
-                                  in case of numpy data.
-        :param categorical_features: The list of categorical features (should only be supplied when passing data as a
-                                     pandas dataframe.
-        :param is_regression: Boolean param indicates that is is a regression problem.
-        """
         if k < 2:
             raise ValueError("k should be a positive integer with a value of 2 or higher")
         if quasi_identifiers is None or len(quasi_identifiers) < 1:
diff --git a/apt/minimization/minimizer.py b/apt/minimization/minimizer.py
index da31b3e..d04cc03 100644
--- a/apt/minimization/minimizer.py
+++ b/apt/minimization/minimizer.py
@@ -39,12 +39,10 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
     estimator : estimator, optional
         The original model for which generalization is being performed.
         Should be pre-fitted.
-
     target_accuracy : float, optional
         The required accuracy when applying the base model to the
         generalized data. Accuracy is measured relative to the original
         accuracy of the model.
-
     features : list of str, optional
         The feature names, in the order that they appear in the data.
     categorical_features: list of str, optional
@@ -63,6 +61,9 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         The required method to train data set for minimizing. Default is
         to train the tree just on the features that are given as
         features_to_minimize.
+    is_regression : Bool, optional
+        Whether the model is a regression model or not (if False, assumes
+        a classification model). Default is False.
 
     Attributes
     ----------
diff --git a/apt/utils.py b/apt/utils.py
index 005c45b..bc73cbc 100644
--- a/apt/utils.py
+++ b/apt/utils.py
@@ -19,20 +19,21 @@ def _load_iris(test_set_size: float = 0.3):
     return (x_train, y_train), (x_test, y_test)
 
 
-def get_iris_dataset():
+def get_iris_dataset(test_set: float = 0.3):
     """
     Loads the Iris dataset from scikit-learn.
 
     :param test_set: Proportion of the data to use as validation split (value between 0 and 1).
     :return: Entire dataset and labels as numpy array.
     """
-    return _load_iris()
+    return _load_iris(test_set)
 
 
 def get_german_credit_dataset(test_set: float = 0.3):
     """
     Loads the UCI German_credit dataset from `tests/datasets/german` or downloads it if necessary.
 
+    :param test_set: Proportion of the data to use as validation split (value between 0 and 1).
     :return: Dataset and labels as pandas dataframes.
     """
 

From d53818644e7a46edf02338d0837cc63c776204ef Mon Sep 17 00:00:00 2001
From: olasaadi <92303887+olasaadi@users.noreply.github.com>
Date: Mon, 7 Mar 2022 20:12:55 +0200
Subject: [PATCH 04/26] Build the dt on all features anon (#23)

* add param to build the DT on all features and not just on QI
* one-hot encoding only for categorical features
---
 apt/anonymization/anonymizer.py | 42 +++++++++++++++++++++----
 tests/test_anonymizer.py        | 54 ++++++++++++++++++++++++++-------
 2 files changed, 79 insertions(+), 17 deletions(-)

diff --git a/apt/anonymization/anonymizer.py b/apt/anonymization/anonymizer.py
index c3bbdb9..9f82c7c 100644
--- a/apt/anonymization/anonymizer.py
+++ b/apt/anonymization/anonymizer.py
@@ -3,6 +3,9 @@ import pandas as pd
 from scipy.spatial import distance
 from collections import Counter
 
+from sklearn.compose import ColumnTransformer
+from sklearn.impute import SimpleImputer
+from sklearn.pipeline import Pipeline
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from sklearn.preprocessing import OneHotEncoder
 
@@ -29,10 +32,13 @@ class Anonymize:
     is_regression : Bool, optional
         Whether the model is a regression model or not (if False, assumes
         a classification model). Default is False.
+    train_only_QI : Bool, optional
+        Whether to train the decision tree only on the quasi-identifier features.
+        Default is False (the tree is trained on all features).
     """
 
     def __init__(self, k: int, quasi_identifiers: Union[np.ndarray, list], categorical_features: Optional[list] = None,
-                 is_regression=False):
+                 is_regression=False, train_only_QI=False):
         if k < 2:
             raise ValueError("k should be a positive integer with a value of 2 or higher")
         if quasi_identifiers is None or len(quasi_identifiers) < 1:
@@ -42,6 +48,7 @@ class Anonymize:
         self.quasi_identifiers = quasi_identifiers
         self.categorical_features = categorical_features
         self.is_regression = is_regression
+        self.train_only_QI = train_only_QI
 
     def anonymize(self, x: Union[np.ndarray, pd.DataFrame], y: Union[np.ndarray, pd.DataFrame]) \
             -> Union[np.ndarray, pd.DataFrame]:
@@ -54,8 +61,10 @@ class Anonymize:
         :return: An array containing the anonymized training dataset.
         """
         if type(x) == np.ndarray:
+            self.features = [i for i in range(x.shape[1])]
             return self._anonymize_ndarray(x.copy(), y)
         else:  # pandas
+            self.features = x.columns
             if not self.categorical_features:
                 raise ValueError('When supplying a pandas dataframe, categorical_features must be defined')
             return self._anonymize_pandas(x.copy(), y)
@@ -63,7 +72,10 @@ class Anonymize:
     def _anonymize_ndarray(self, x, y):
         if x.shape[0] != y.shape[0]:
             raise ValueError("x and y should have same number of rows")
-        x_anonymizer_train = x[:, self.quasi_identifiers]
+        x_anonymizer_train = x
+        if self.train_only_QI:
+            # build DT just on QI features
+            x_anonymizer_train = x[:, self.quasi_identifiers]
         if x.dtype.kind not in 'iufc':
             x_prepared = self._modify_categorical_features(x_anonymizer_train)
         else:
@@ -79,7 +91,10 @@ class Anonymize:
     def _anonymize_pandas(self, x, y):
         if x.shape[0] != y.shape[0]:
             raise ValueError("x and y should have same number of rows")
-        x_anonymizer_train = x.loc[:, self.quasi_identifiers]
+        x_anonymizer_train = x
+        if self.train_only_QI:
+            # build DT just on QI features
+            x_anonymizer_train = x.loc[:, self.quasi_identifiers]
         # need to one-hot encode before training the decision tree
         x_prepared = self._modify_categorical_features(x_anonymizer_train)
         if self.is_regression:
@@ -169,6 +184,21 @@ class Anonymize:
         return x
 
     def _modify_categorical_features(self, x):
-        encoder = OneHotEncoder()
-        one_hot_encoded = encoder.fit_transform(x)
-        return one_hot_encoded
+        # prepare data for DT
+        used_features = self.features
+        if self.train_only_QI:
+            used_features = self.quasi_identifiers
+        numeric_features = [f for f in x.columns if f in used_features and f not in self.categorical_features]
+        categorical_features = [f for f in self.categorical_features if f in used_features]
+        numeric_transformer = Pipeline(
+            steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
+        )
+        categorical_transformer = OneHotEncoder(handle_unknown="ignore", sparse=False)
+        preprocessor = ColumnTransformer(
+            transformers=[
+                ("num", numeric_transformer, numeric_features),
+                ("cat", categorical_transformer, categorical_features),
+            ]
+        )
+        encoded = preprocessor.fit_transform(x)
+        return encoded
diff --git a/tests/test_anonymizer.py b/tests/test_anonymizer.py
index 466c129..000eefa 100644
--- a/tests/test_anonymizer.py
+++ b/tests/test_anonymizer.py
@@ -1,5 +1,8 @@
 import pytest
 import numpy as np
+from sklearn.compose import ColumnTransformer
+from sklearn.impute import SimpleImputer
+from sklearn.pipeline import Pipeline
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from sklearn.preprocessing import OneHotEncoder
 
@@ -17,7 +20,7 @@ def test_anonymize_ndarray_iris():
 
     k = 10
     QI = [0, 2]
-    anonymizer = Anonymize(k, QI)
+    anonymizer = Anonymize(k, QI, train_only_QI=True)
     anon = anonymizer.anonymize(x_train, pred)
     assert(len(np.unique(anon[:, QI], axis=0)) < len(np.unique(x_train[:, QI], axis=0)))
     _, counts_elements = np.unique(anon[:, QI], return_counts=True)
@@ -27,16 +30,31 @@ def test_anonymize_ndarray_iris():
 
 def test_anonymize_pandas_adult():
     (x_train, y_train), _ = get_adult_dataset()
-    encoded = OneHotEncoder().fit_transform(x_train)
-    model = DecisionTreeClassifier()
-    model.fit(encoded, y_train)
-    pred = model.predict(encoded)
 
     k = 100
+    features = ['age', 'workclass', 'education-num', 'marital-status', 'occupation',
+                'relationship', 'race', 'sex', 'capital-gain', 'capital-loss', 'hours-per-week', 'native-country']
     QI = ['age', 'workclass', 'education-num', 'marital-status', 'occupation', 'relationship', 'race', 'sex',
           'native-country']
     categorical_features = ['workclass', 'marital-status', 'occupation', 'relationship', 'race', 'sex',
                             'native-country']
+    # prepare data for DT
+    numeric_features = [f for f in features if f not in categorical_features]
+    numeric_transformer = Pipeline(
+        steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
+    )
+    categorical_transformer = OneHotEncoder(handle_unknown="ignore", sparse=False)
+    preprocessor = ColumnTransformer(
+        transformers=[
+            ("num", numeric_transformer, numeric_features),
+            ("cat", categorical_transformer, categorical_features),
+        ]
+    )
+    encoded = preprocessor.fit_transform(x_train)
+    model = DecisionTreeClassifier()
+    model.fit(encoded, y_train)
+    pred = model.predict(encoded)
+
     anonymizer = Anonymize(k, QI, categorical_features=categorical_features)
     anon = anonymizer.anonymize(x_train, pred)
 
@@ -48,15 +66,29 @@ def test_anonymize_pandas_adult():
 def test_anonymize_pandas_nursery():
     (x_train, y_train), _ = get_nursery_dataset()
     x_train = x_train.astype(str)
-    encoded = OneHotEncoder().fit_transform(x_train)
+
+    k = 100
+    features = ["parents", "has_nurs", "form", "children", "housing", "finance", "social", "health"]
+    QI = ["finance", "social", "health"]
+    categorical_features = ["parents", "has_nurs", "form", "housing", "finance", "social", "health", 'children']
+    # prepare data for DT
+    numeric_features = [f for f in features if f not in categorical_features]
+    numeric_transformer = Pipeline(
+        steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
+    )
+    categorical_transformer = OneHotEncoder(handle_unknown="ignore", sparse=False)
+    preprocessor = ColumnTransformer(
+        transformers=[
+            ("num", numeric_transformer, numeric_features),
+            ("cat", categorical_transformer, categorical_features),
+        ]
+    )
+    encoded = preprocessor.fit_transform(x_train)
     model = DecisionTreeClassifier()
     model.fit(encoded, y_train)
     pred = model.predict(encoded)
 
-    k = 100
-    QI = ["finance", "social", "health"]
-    categorical_features = ["parents", "has_nurs", "form", "housing", "finance", "social", "health", 'children']
-    anonymizer = Anonymize(k, QI, categorical_features=categorical_features)
+    anonymizer = Anonymize(k, QI, categorical_features=categorical_features, train_only_QI=True)
     anon = anonymizer.anonymize(x_train, pred)
 
     assert(anon.loc[:, QI].drop_duplicates().shape[0] < x_train.loc[:, QI].drop_duplicates().shape[0])
@@ -74,7 +106,7 @@ def test_regression():
     pred = model.predict(x_train)
     k = 10
     QI = [0, 2, 5, 8]
-    anonymizer = Anonymize(k, QI, is_regression=True)
+    anonymizer = Anonymize(k, QI, is_regression=True, train_only_QI=True)
     anon = anonymizer.anonymize(x_train, pred)
     print('Base model accuracy (R2 score): ', model.score(x_test, y_test))
     model.fit(anon, y_train)

From 2b2dab6bef88352e95fd8763ca1777d269e92e0e Mon Sep 17 00:00:00 2001
From: abigailgold <57357634+abigailgold@users.noreply.github.com>
Date: Wed, 27 Apr 2022 12:33:27 +0300
Subject: [PATCH 05/26] Data and Model wrappers (#26)

* Squashed commit of wrappers:

    Wrapper minimizer

    * apply dataset wrapper on minimizer
    * apply changes on minimization notebook
    * add black_box_access and unlimited_queries params

    Dataset wrapper anonymizer

    Add features_names to ArrayDataset
    and allow providing features names in QI and Cat features not just indexes

    update notebooks

    categorical features and QI passed by indexes
    dataset include feature names and is_pandas param

    add pytorch Dataset

    Remove redundant code.
    Use data wrappers in model wrapper APIs.

    add generic dataset components

    Create initial version of wrappers for models

* Fix handling of categorical features
---
 apt/anonymization/anonymizer.py               | 104 ++--
 apt/minimization/minimizer.py                 | 189 ++++---
 apt/utils/__init__.py                         |   0
 apt/{utils.py => utils/dataset_utils.py}      |  27 +-
 apt/utils/datasets/__init__.py                |   7 +
 apt/utils/datasets/datasets.py                | 320 +++++++++++
 apt/utils/models/__init__.py                  |   2 +
 apt/utils/models/model.py                     | 109 ++++
 apt/utils/models/sklearn_model.py             | 112 ++++
 ...bute_inference_anonymization_nursery.ipynb | 523 +++---------------
 ...ership_inference_anonymization_adult.ipynb |  80 ++-
 ...membership_inference_dp_diabetes_reg.ipynb |  33 +-
 notebooks/minimization_adult.ipynb            |  85 +--
 requirements.txt                              |   1 +
 tests/test_anonymizer.py                      |  29 +-
 tests/test_minimizer.py                       | 436 ++++++++++++---
 tests/test_model.py                           |  35 ++
 17 files changed, 1340 insertions(+), 752 deletions(-)
 create mode 100644 apt/utils/__init__.py
 rename apt/{utils.py => utils/dataset_utils.py} (93%)
 create mode 100644 apt/utils/datasets/__init__.py
 create mode 100644 apt/utils/datasets/datasets.py
 create mode 100644 apt/utils/models/__init__.py
 create mode 100644 apt/utils/models/model.py
 create mode 100644 apt/utils/models/sklearn_model.py
 create mode 100644 tests/test_model.py

diff --git a/apt/anonymization/anonymizer.py b/apt/anonymization/anonymizer.py
index 9f82c7c..02854f5 100644
--- a/apt/anonymization/anonymizer.py
+++ b/apt/anonymization/anonymizer.py
@@ -8,6 +8,7 @@ from sklearn.impute import SimpleImputer
 from sklearn.pipeline import Pipeline
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from sklearn.preprocessing import OneHotEncoder
+from apt.utils.datasets import ArrayDataset, DATA_PANDAS_NUMPY_TYPE
 
 from typing import Union, Optional
 
@@ -49,61 +50,64 @@ class Anonymize:
         self.categorical_features = categorical_features
         self.is_regression = is_regression
         self.train_only_QI = train_only_QI
+        self.features_names = None
+        self.features = None
 
-    def anonymize(self, x: Union[np.ndarray, pd.DataFrame], y: Union[np.ndarray, pd.DataFrame]) \
-            -> Union[np.ndarray, pd.DataFrame]:
+    def anonymize(self, dataset: ArrayDataset) -> DATA_PANDAS_NUMPY_TYPE:
         """
         Method for performing model-guided anonymization.
 
-        :param x: The training data for the model. If provided as a pandas dataframe, may contain both numeric and
-                  categorical data.
-        :param y: The predictions of the original model on the training data.
+        :param dataset: Data wrapper containing the training data for the model and the predictions of the
+                        original model on the training data.
         :return: An array containing the anonymized training dataset.
         """
-        if type(x) == np.ndarray:
-            self.features = [i for i in range(x.shape[1])]
-            return self._anonymize_ndarray(x.copy(), y)
-        else:  # pandas
-            self.features = x.columns
-            if not self.categorical_features:
-                raise ValueError('When supplying a pandas dataframe, categorical_features must be defined')
-            return self._anonymize_pandas(x.copy(), y)
+        if dataset.get_samples().shape[1] != 0:
+            self.features = [i for i in range(dataset.get_samples().shape[1])]
+        else:
+            raise ValueError('No data provided')
 
-    def _anonymize_ndarray(self, x, y):
+        if dataset.features_names is not None:
+            self.features_names = dataset.features_names
+        else: # if no names provided, use numbers instead
+            self.features_names = self.features
+
+        if not set(self.quasi_identifiers).issubset(set(self.features_names)):
+            raise ValueError('Quasi identifiers should bs a subset of the supplied features or indexes in range of '
+                             'the data columns')
+        if self.categorical_features and not set(self.categorical_features).issubset(set(self.features_names)):
+            raise ValueError('Categorical features should bs a subset of the supplied features or indexes in range of '
+                             'the data columns')
+        self.quasi_identifiers = [i for i, v in enumerate(self.features_names) if v in self.quasi_identifiers]
+        if self.categorical_features:
+            self.categorical_features = [i for i, v in enumerate(self.features_names) if v in self.categorical_features]
+
+        transformed = self._anonymize(dataset.get_samples().copy(), dataset.get_labels())
+        if dataset.is_pandas:
+            return pd.DataFrame(transformed, columns=self.features_names)
+        else:
+            return transformed
+
+    def _anonymize(self, x, y):
         if x.shape[0] != y.shape[0]:
             raise ValueError("x and y should have same number of rows")
-        x_anonymizer_train = x
-        if self.train_only_QI:
-            # build DT just on QI features
-            x_anonymizer_train = x[:, self.quasi_identifiers]
         if x.dtype.kind not in 'iufc':
-            x_prepared = self._modify_categorical_features(x_anonymizer_train)
+            if not self.categorical_features:
+                raise ValueError('when supplying an array with non-numeric data, categorical_features must be defined')
+            x_prepared = self._modify_categorical_features(x)
         else:
-            x_prepared = x_anonymizer_train
-        if self.is_regression:
-            self.anonymizer = DecisionTreeRegressor(random_state=10, min_samples_split=2, min_samples_leaf=self.k)
-        else:
-            self.anonymizer = DecisionTreeClassifier(random_state=10, min_samples_split=2, min_samples_leaf=self.k)
-        self.anonymizer.fit(x_prepared, y)
-        cells_by_id = self._calculate_cells(x, x_prepared)
-        return self._anonymize_data_numpy(x, x_prepared, cells_by_id)
-
-    def _anonymize_pandas(self, x, y):
-        if x.shape[0] != y.shape[0]:
-            raise ValueError("x and y should have same number of rows")
-        x_anonymizer_train = x
+            x_prepared = x
+        x_anonymizer_train = x_prepared
         if self.train_only_QI:
             # build DT just on QI features
-            x_anonymizer_train = x.loc[:, self.quasi_identifiers]
-        # need to one-hot encode before training the decision tree
-        x_prepared = self._modify_categorical_features(x_anonymizer_train)
+            x_anonymizer_train = x_prepared[:, self.quasi_identifiers]
         if self.is_regression:
             self.anonymizer = DecisionTreeRegressor(random_state=10, min_samples_split=2, min_samples_leaf=self.k)
         else:
             self.anonymizer = DecisionTreeClassifier(random_state=10, min_samples_split=2, min_samples_leaf=self.k)
-        self.anonymizer.fit(x_prepared, y)
-        cells_by_id = self._calculate_cells(x, x_prepared)
-        return self._anonymize_data_pandas(x, x_prepared, cells_by_id)
+
+        self.anonymizer.fit(x_anonymizer_train, y)
+        cells_by_id = self._calculate_cells(x, x_anonymizer_train)
+        return self._anonymize_data(x, x_anonymizer_train, cells_by_id)
 
     def _calculate_cells(self, x, x_anonymizer_train):
         # x is original data, x_anonymizer_train is only QIs + 1-hot encoded
@@ -130,15 +134,9 @@ class Anonymize:
             # get all rows in cell
             indexes = [index for index, node_id in enumerate(node_ids) if node_id == cell['id']]
             # TODO: should we filter only those with majority label? (using hist)
-            if type(x) == np.ndarray:
-                rows = x[indexes]
-            else:  # pandas
-                rows = x.iloc[indexes]
+            rows = x[indexes]
             for feature in self.quasi_identifiers:
-                if type(x) == np.ndarray:
-                    values = rows[:, feature]
-                else:  # pandas
-                    values = rows.loc[:, feature]
+                values = rows[:, feature]
                 if self.categorical_features and feature in self.categorical_features:
                     # find most common value
                     cell['representative'][feature] = Counter(values).most_common(1)[0][0]
@@ -163,7 +161,7 @@ class Anonymize:
         node_ids = self._find_sample_nodes(samples)
         return [cells_by_id[node_id] for node_id in node_ids]
 
-    def _anonymize_data_numpy(self, x, x_anonymizer_train, cells_by_id):
+    def _anonymize_data(self, x, x_anonymizer_train, cells_by_id):
         cells = self._find_sample_cells(x_anonymizer_train, cells_by_id)
         index = 0
         for row in x:
@@ -173,22 +171,12 @@ class Anonymize:
                 row[feature] = cell['representative'][feature]
         return x
 
-    def _anonymize_data_pandas(self, x, x_anonymizer_train, cells_by_id):
-        cells = self._find_sample_cells(x_anonymizer_train, cells_by_id)
-        index = 0
-        for i, row in x.iterrows():
-            cell = cells[index]
-            index += 1
-            for feature in cell['representative']:
-                x.at[i, feature] = cell['representative'][feature]
-        return x
-
     def _modify_categorical_features(self, x):
         # prepare data for DT
         used_features = self.features
         if self.train_only_QI:
             used_features = self.quasi_identifiers
-        numeric_features = [f for f in x.columns if f in used_features and f not in self.categorical_features]
+        numeric_features = [f for f in self.features if f in used_features and f not in self.categorical_features]
         categorical_features = [f for f in self.categorical_features if f in used_features]
         numeric_transformer = Pipeline(
             steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
diff --git a/apt/minimization/minimizer.py b/apt/minimization/minimizer.py
index d04cc03..27b6b6e 100644
--- a/apt/minimization/minimizer.py
+++ b/apt/minimization/minimizer.py
@@ -1,7 +1,7 @@
 """
 This module implements all classes needed to perform data minimization
 """
-from typing import Union
+from typing import Union, Optional
 import pandas as pd
 import numpy as np
 import copy
@@ -16,6 +16,9 @@ from sklearn.utils.validation import check_X_y, check_array, check_is_fitted
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from sklearn.model_selection import train_test_split
 
+from apt.utils.datasets import ArrayDataset, Data, DATA_PANDAS_NUMPY_TYPE
+from apt.utils.models import Model, SklearnRegressor, ModelOutputType, SklearnClassifier
+
 
 class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerMixin):
     """ A transformer that generalizes data to representative points.
@@ -24,16 +27,13 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
     and a target accuracy. Once the generalizations are learned, can
     receive one or more data records and transform them to representative
     points based on the learned generalization.
-
-    An alternative way to use the transformer is to supply ``cells`` and
-    ``features`` in init or set_params and those will be used to transform
+    An alternative way to use the transformer is to supply ``cells`` in
+    init or set_params and those will be used to transform
     data to representatives. In this case, fit must still be called but
     there is no need to supply it with ``X`` and ``y``, and there is no
     need to supply an existing ``estimator`` to init.
-
     In summary, either ``estimator`` and ``target_accuracy`` should be
-    supplied or ``cells`` and ``features`` should be supplied.
-
+    supplied or ``cells`` should be supplied.
     Parameters
     ----------
     estimator : estimator, optional
@@ -43,8 +43,6 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         The required accuracy when applying the base model to the
         generalized data. Accuracy is measured relative to the original
         accuracy of the model.
-    features : list of str, optional
-        The feature names, in the order that they appear in the data.
     categorical_features: list of str, optional
         The list of categorical features should only be supplied when
          passing data as a pandas dataframe.
@@ -67,28 +65,29 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
     Attributes
     ----------
+    features_ : list of str
+        The feature names, in the order that they appear in the data.
     cells_ : list of object
         The cells used to generalize records, as learned when calling fit.
-
     ncp_ : float
         The NCP (information loss) score of the resulting generalization,
         as measured on the training data.
-
     generalizations_ : object
         The generalizations that were learned (actual feature ranges).
-
-    Notes
-    -----
-
-
     """
 
-    def __init__(self, estimator=None, target_accuracy=0.998, features=None,
-                 cells=None, categorical_features=None, features_to_minimize: Union[np.ndarray, list] = None
-                 , train_only_QI=True, is_regression=False):
-        self.estimator = estimator
+    def __init__(self, estimator: Union[BaseEstimator, Model] = None, target_accuracy: float = 0.998,
+                 cells: list = None, categorical_features: Union[np.ndarray, list] = None,
+                 features_to_minimize: Union[np.ndarray, list] = None, train_only_QI: bool = True,
+                 is_regression: bool = False):
+        if issubclass(estimator.__class__, Model):
+            self.estimator = estimator
+        else:
+            if is_regression:
+                self.estimator = SklearnRegressor(estimator)
+            else:
+                self.estimator = SklearnClassifier(estimator, ModelOutputType.CLASSIFIER_VECTOR)
         self.target_accuracy = target_accuracy
-        self.features = features
         self.cells = cells
         self.categorical_features = []
         if categorical_features:
@@ -114,11 +113,9 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         ret = {}
         ret['target_accuracy'] = self.target_accuracy
         if deep:
-            ret['features'] = copy.deepcopy(self.features)
             ret['cells'] = copy.deepcopy(self.cells)
             ret['estimator'] = self.estimator
         else:
-            ret['features'] = copy.copy(self.features)
             ret['cells'] = copy.copy(self.cells)
         return ret
 
@@ -132,8 +129,6 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         """
         if 'target_accuracy' in params:
             self.target_accuracy = params['target_accuracy']
-        if 'features' in params:
-            self.features = params['features']
         if 'cells' in params:
             self.cells = params['cells']
         return self
@@ -142,7 +137,8 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
     def generalizations(self):
         return self.generalizations_
 
-    def fit_transform(self, X: Union[np.ndarray, pd.DataFrame] = None, y: Union[np.ndarray, pd.DataFrame] = None):
+    def fit_transform(self, X: Optional[DATA_PANDAS_NUMPY_TYPE] = None, y: Optional[DATA_PANDAS_NUMPY_TYPE] = None,
+                      features_names: Optional = None, dataset: Optional[ArrayDataset] = None):
         """Learns the generalizations based on training data, and applies them to the data.
 
         Parameters
@@ -152,17 +148,22 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         y : array-like, shape (n_samples,), optional
             The target values. An array of int.
             This should contain the predictions of the original model on ``X``.
-
+        features_names : list of str, The feature names, in the order that they appear in the data,
+                        provided just if X and y were provided (optional).
+        dataset : Data wrapper containing the training input samples and the predictions of the
+                  original model on the training data.
+        Either X,y OR dataset need to be provided, not both.
         Returns
         -------
         X_transformed : numpy or pandas according to the input type, shape (n_samples, n_features)
             The array containing the representative values to which each record in
             ``X`` is mapped.
         """
-        self.fit(X, y)
-        return self.transform(X)
+        self.fit(X, y, features_names, dataset=dataset)
+        return self.transform(X, features_names, dataset=dataset)
 
-    def fit(self, X: Union[np.ndarray, pd.DataFrame] = None, y: Union[np.ndarray, pd.DataFrame] = None):
+    def fit(self, X: Optional[DATA_PANDAS_NUMPY_TYPE] = None, y: Optional[DATA_PANDAS_NUMPY_TYPE] = None,
+            features_names: Optional = None, dataset: ArrayDataset = None):
         """Learns the generalizations based on training data.
 
         Parameters
@@ -172,7 +173,11 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         y : array-like, shape (n_samples,), optional
             The target values. An array of int.
             This should contain the predictions of the original model on ``X``.
-
+        features_names : list of str, The feature names, in the order that they appear in the data,
+                        provided just if X and y were provided (optional).
+        dataset : Data wrapper containing the training input samples and the predictions of the
+                  original model on the training data.
+        Either X,y OR dataset need to be provided, not both.
         Returns
         -------
         X_transformed : numpy or pandas according to the input type, shape (n_samples, n_features)
@@ -181,26 +186,25 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         """
 
         # take into account that estimator, X, y, cells, features may be None
-        if X is not None:
-            if type(X) == np.ndarray:
-                self.is_numpy = True
-            else:
-                self.is_numpy = False
-
         if X is not None and y is not None:
-            if self.is_numpy:
-                X, y = check_X_y(X, y, accept_sparse=True)
-            self.n_features_ = X.shape[1]
-        elif self.features:
-            self.n_features_ = len(self.features)
+            if dataset is not None:
+                raise ValueError('Either X,y OR dataset need to be provided, not both')
+            else:
+                dataset = ArrayDataset(X, y, features_names)
+
+        if dataset and dataset.get_samples() is not None and dataset.get_labels() is not None:
+            self.n_features_ = dataset.get_samples().shape[1]
+
+        elif dataset and dataset.features_names:
+            self.n_features_ = len(dataset.features_names)
         else:
             self.n_features_ = 0
 
-        if self.features:
-            self._features = self.features
+        if dataset and dataset.features_names:
+            self._features = dataset.features_names
         # if features is None, use numbers instead of names
         elif self.n_features_ != 0:
-            self._features = [i for i in range(self.n_features_)]
+            self._features = [str(i) for i in range(self.n_features_)]
         else:
             self._features = None
 
@@ -212,27 +216,24 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
         # Going to fit
         # (currently not dealing with option to fit with only X and y and no estimator)
-        if self.estimator and X is not None and y is not None:
+        if self.estimator and dataset and dataset.get_samples() is not None and dataset.get_labels() is not None:
+            x = pd.DataFrame(dataset.get_samples(), columns=self._features)
+            if not self.features_to_minimize:
+                self.features_to_minimize = self._features
+            self.features_to_minimize = [str(i) for i in self.features_to_minimize]
+            if not all(elem in self._features for elem in self.features_to_minimize):
+                raise ValueError('features to minimize should be a subset of features names')
+            x_QI = x.loc[:, self.features_to_minimize]
 
-            if self.is_numpy:
-                if not self.features_to_minimize:
-                    self.features_to_minimize = [i for i in range(len(self._features))]
-                x_QI = X[:, self.features_to_minimize]
-                self.features_to_minimize = [self._features[i] for i in self.features_to_minimize]
-                X = pd.DataFrame(X, columns=self._features)
-            else:
-                if not self.features_to_minimize:
-                    self.features_to_minimize = self._features
-                x_QI = X.loc[:, self.features_to_minimize]
-            x_QI = pd.DataFrame(x_QI, columns=self.features_to_minimize)
             # divide dataset into train and test
-            used_data = X
+            used_data = x
             if self.train_only_QI:
                 used_data = x_QI
             if self.is_regression:
-                X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.4, random_state=14)
+                X_train, X_test, y_train, y_test = train_test_split(x, dataset.get_labels(), test_size=0.4, random_state=14)
             else:
-                X_train, X_test, y_train, y_test = train_test_split(X, y, stratify=y, test_size=0.4, random_state=18)
+                X_train, X_test, y_train, y_test = train_test_split(x, dataset.get_labels(), stratify=dataset.get_labels(), test_size=0.4,
+                                                                    random_state=18)
 
             X_train_QI = X_train.loc[:, self.features_to_minimize]
             X_test_QI = X_test.loc[:, self.features_to_minimize]
@@ -246,7 +247,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             for feature in self._features:
                 if feature not in feature_data.keys():
                     fd = {}
-                    values = list(X.loc[:, feature])
+                    values = list(x.loc[:, feature])
                     if feature not in self.categorical_features:
                         fd['min'] = min(values)
                         fd['max'] = max(values)
@@ -259,7 +260,6 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             categorical_features = [f for f in self._features if f in self.categorical_features and
                                     f in self.features_to_minimize]
 
-
             numeric_transformer = Pipeline(
                 steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
             )
@@ -288,7 +288,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     ("cat", categorical_transformer, self.categorical_features),
                 ]
             )
-            preprocessor.fit(X)
+            preprocessor.fit(x)
             x_prepared = preprocessor.transform(X_train)
             if self.train_only_QI:
                 x_prepared = preprocessor_QI_features.transform(X_train_QI)
@@ -300,7 +300,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 self.dt_ = DecisionTreeRegressor(random_state=10, min_samples_split=2, min_samples_leaf=1)
             else:
                 self.dt_ = DecisionTreeClassifier(random_state=0, min_samples_split=2,
-                                              min_samples_leaf=1)
+                                                  min_samples_leaf=1)
             self.dt_.fit(x_prepared, y_train)
             self._modify_categorical_features(used_data)
 
@@ -329,7 +329,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells_, self.cells_by_id_)
 
             # check accuracy
-            accuracy = self.estimator.score(preprocessor.transform(generalized), y_test)
+            accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
             print('Initial accuracy of model on generalized data, relative to original model predictions '
                   '(base generalization derived from tree, before improvements): %f' % accuracy)
 
@@ -349,7 +349,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                         self._calculate_generalizations()
                         generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells_,
                                                        self.cells_by_id_)
-                        accuracy = self.estimator.score(preprocessor.transform(generalized), y_test)
+                        accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
                         # if accuracy passed threshold roll back to previous iteration generalizations
                         if accuracy < self.target_accuracy:
                             self.cells_ = cells_previous_iter
@@ -375,7 +375,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
                     self._calculate_generalizations()
                     generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells_, self.cells_by_id_)
-                    accuracy = self.estimator.score(preprocessor.transform(generalized), y_test)
+                    accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
                     print('Removed feature: %s, new relative accuracy: %f' % (removed_feature, accuracy))
 
             # self.cells_ currently holds the chosen generalization based on target accuracy
@@ -386,7 +386,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         # Return the transformer
         return self
 
-    def transform(self, X: Union[np.ndarray, pd.DataFrame]):
+    def transform(self, X: Optional[DATA_PANDAS_NUMPY_TYPE] = None, features_names: Optional = None, dataset: ArrayDataset = None):
         """ Transforms data records to representative points.
 
         Parameters
@@ -394,6 +394,10 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         X : {array-like, sparse-matrix}, shape (n_samples, n_features), If provided as a pandas dataframe,
          may contain both numeric and categorical data.
             The input samples.
+        features_names : list of str, The feature names, in the order that they appear in the data,
+                        provided just if X was provided (optional).
+        dataset : Data wrapper containing the training input samples.
+        Either X OR dataset need to be provided, not both.
         Returns
         -------
         X_transformed : numpy or pandas according to the input type, shape (n_samples, n_features)
@@ -405,26 +409,30 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         msg = 'This %(name)s instance is not initialized yet. ' \
               'Call ‘fit’ or ‘set_params’ with ' \
               'appropriate arguments before using this method.'
-        check_is_fitted(self, ['cells', 'features'], msg=msg)
+        check_is_fitted(self, ['cells'], msg=msg)
 
-        if type(X) == np.ndarray:
-            # Input validation
-            X = check_array(X, accept_sparse=True)
-            self.is_numpy = True
-            X = pd.DataFrame(X, columns=self._features)
-        else:
-            self.is_numpy = False
+        if X is not None:
+            if dataset is not None:
+                raise ValueError('Either X OR dataset need to be provided, not both')
+            else:
+                dataset = ArrayDataset(X, features_names=features_names)
+        elif dataset is None:
+            raise ValueError('Either X OR dataset need to be provided, not both')
+        if dataset and dataset.features_names:
+            self._features = dataset.features_names
+        if dataset and dataset.get_samples() is not None:
+            x = pd.DataFrame(dataset.get_samples(), columns=self._features)
 
-        if X.shape[1] != self.n_features_ and self.n_features_ != 0:
+        if x.shape[1] != self.n_features_ and self.n_features_ != 0:
             raise ValueError('Shape of input is different from what was seen'
                              'in `fit`')
 
         if not self._features:
-            self._features = [i for i in range(X.shape[1])]
+            self._features = [i for i in range(x.shape[1])]
 
         representatives = pd.DataFrame(columns=self._features)  # only columns
-        generalized = pd.DataFrame(X, columns=self._features, copy=True)  # original data
-        mapped = np.zeros(X.shape[0])  # to mark records we already mapped
+        generalized = pd.DataFrame(x, columns=self._features, copy=True)  # original data
+        mapped = np.zeros(x.shape[0])  # to mark records we already mapped
 
         # iterate over cells (leaves in decision tree)
         for i in range(len(self.cells_)):
@@ -443,7 +451,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     representatives = representatives.drop(feature, axis=1)
 
             # get the indexes of all records that map to this cell
-            indexes = self._get_record_indexes_for_cell(X, self.cells_[i], mapped)
+            indexes = self._get_record_indexes_for_cell(x, self.cells_[i], mapped)
 
             # replace the values in the representative columns with the representative
             # values (leaves others untouched)
@@ -454,9 +462,11 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     replace = representatives.loc[i].to_frame().T.reset_index(drop=True)
                 replace.index = indexes
                 generalized.loc[indexes, representatives.columns] = replace
-        if self.is_numpy:
-            return generalized.to_numpy()
-        return generalized
+        if dataset and dataset.is_pandas:
+            return generalized
+        elif isinstance(X, pd.DataFrame):
+            return generalized
+        return generalized.to_numpy()
 
     def _get_record_indexes_for_cell(self, X, cell, mapped):
         indexes = []
@@ -640,7 +650,8 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             # else: nothing to do, stay with previous cells
 
     def _calculate_level_cell_label(self, left_cell, right_cell, new_cell):
-        new_cell['hist'] = [x + y for x, y in zip(left_cell['hist'], right_cell['hist'])] if not self.is_regression else []
+        new_cell['hist'] = [x + y for x, y in
+                            zip(left_cell['hist'], right_cell['hist'])] if not self.is_regression else []
         new_cell['label'] = int(self.dt_.classes_[np.argmax(new_cell['hist'])]) if not self.is_regression else 1
 
     def _get_nodes_level(self, level):
@@ -797,8 +808,8 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     cells_by_id = copy.deepcopy(self.cells_by_id_)
                     GeneralizeToRepresentative._remove_feature_from_cells(new_cells, cells_by_id, feature)
                     generalized = self._generalize(original_data, prepared_data, nodes, new_cells, cells_by_id)
-                    accuracy_gain = self.estimator.score(self._preprocessor.transform(generalized),
-                                                         labels) - current_accuracy
+                    accuracy_gain = self.estimator.score(ArrayDataset(self._preprocessor.transform(generalized),
+                                                                      labels)) - current_accuracy
                     if accuracy_gain < 0:
                         accuracy_gain = 0
                     if accuracy_gain != 0:
@@ -820,8 +831,8 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     cells_by_id = copy.deepcopy(self.cells_by_id_)
                     GeneralizeToRepresentative._remove_feature_from_cells(new_cells, cells_by_id, feature)
                     generalized = self._generalize(original_data, prepared_data, nodes, new_cells, cells_by_id)
-                    accuracy_gain = self.estimator.score(self._preprocessor.transform(generalized),
-                                                         labels) - current_accuracy
+                    accuracy_gain = self.estimator.score(ArrayDataset(self._preprocessor.transform(generalized),
+                                                                      labels)) - current_accuracy
 
                     if accuracy_gain < 0:
                         accuracy_gain = 0
diff --git a/apt/utils/__init__.py b/apt/utils/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/apt/utils.py b/apt/utils/dataset_utils.py
similarity index 93%
rename from apt/utils.py
rename to apt/utils/dataset_utils.py
index bc73cbc..e3eb959 100644
--- a/apt/utils.py
+++ b/apt/utils/dataset_utils.py
@@ -13,8 +13,7 @@ def _load_iris(test_set_size: float = 0.3):
 
     # Split training and test sets
     x_train, x_test, y_train, y_test = model_selection.train_test_split(data, labels, test_size=test_set_size,
-                                                                        random_state=18, stratify=labels,
-                                                                        shuffle=True)
+                                                                                random_state=18, stratify=labels)
 
     return (x_train, y_train), (x_test, y_test)
 
@@ -29,6 +28,28 @@ def get_iris_dataset(test_set: float = 0.3):
     return _load_iris(test_set)
 
 
+def _load_diabetes(test_set_size: float = 0.3):
+    """Load scikit-learn's diabetes data and return ((x_train, y_train), (x_test, y_test))."""
+    bunch = datasets.load_diabetes()
+    features, targets = bunch.data, bunch.target
+
+    # The fixed random_state makes the split identical on every call.
+    train_x, test_x, train_y, test_y = model_selection.train_test_split(
+        features, targets, test_size=test_set_size, random_state=18)
+
+    return (train_x, train_y), (test_x, test_y)
+
+
+def get_diabetes_dataset(test_set: float = 0.3):
+    """
+    Loads the Diabetes dataset from scikit-learn.
+
+    :param test_set: Proportion of the data to use as validation split (value between 0 and 1).
+    :return: Training and test splits as ((x_train, y_train), (x_test, y_test)) numpy arrays.
+    """
+    return _load_diabetes(test_set)
+
+
 def get_german_credit_dataset(test_set: float = 0.3):
     """
     Loads the UCI German_credit dataset from `tests/datasets/german` or downloads it if necessary.
@@ -253,7 +274,7 @@ def get_nursery_dataset(raw: bool = True, test_set: float = 0.2, transform_socia
             raise Exception("Bad label value: %s" % value)
 
     data["label"] = data["label"].apply(modify_label)
-    data["children"] = data["children"].apply(lambda x: 4 if x == "more" else x)
+    data["children"] = data["children"].apply(lambda x: "4" if x == "more" else x)
 
     if transform_social:
 
diff --git a/apt/utils/datasets/__init__.py b/apt/utils/datasets/__init__.py
new file mode 100644
index 0000000..6e7c640
--- /dev/null
+++ b/apt/utils/datasets/__init__.py
@@ -0,0 +1,7 @@
+"""
+The AI Privacy Toolbox (datasets).
+Implementation of datasets utility components for datasets creation, load, and store
+"""
+
+from apt.utils.datasets.datasets import Dataset, StoredDataset, DatasetFactory, Data, ArrayDataset, \
+    OUTPUT_DATA_ARRAY_TYPE, DATA_PANDAS_NUMPY_TYPE
diff --git a/apt/utils/datasets/datasets.py b/apt/utils/datasets/datasets.py
new file mode 100644
index 0000000..ff7c296
--- /dev/null
+++ b/apt/utils/datasets/datasets.py
@@ -0,0 +1,320 @@
+# !/usr/bin/env python
+"""
+The AI Privacy Toolbox (datasets).
+Implementation of utility classes for dataset handling
+"""
+
+from abc import ABCMeta, abstractmethod
+from typing import Callable, Collection, Any, Union, List, Optional
+
+import tarfile
+import os
+import urllib.request
+import numpy as np
+import pandas as pd
+import logging
+import torch
+from torch import Tensor
+
+logger = logging.getLogger(__name__)
+
+
+INPUT_DATA_ARRAY_TYPE = Union[np.ndarray, pd.DataFrame, List, Tensor]
+OUTPUT_DATA_ARRAY_TYPE = np.ndarray
+DATA_PANDAS_NUMPY_TYPE = Union[np.ndarray, pd.DataFrame]
+
+
+def array2numpy(self, arr: INPUT_DATA_ARRAY_TYPE) -> OUTPUT_DATA_ARRAY_TYPE:
+    """
+    Convert ``arr`` (numpy array, pandas DataFrame/Series, list or torch Tensor) to a numpy array.
+    Sets ``self.is_pandas = True`` on the owner object when ``arr`` is a pandas object.
+    """
+    # isinstance (not type ==) so subclasses such as torch.nn.Parameter are accepted too.
+    if isinstance(arr, np.ndarray):
+        return arr
+    if isinstance(arr, (pd.DataFrame, pd.Series)):
+        self.is_pandas = True
+        return arr.to_numpy()
+    if isinstance(arr, list):
+        return np.array(arr)
+    if isinstance(arr, Tensor):
+        return arr.detach().cpu().numpy()
+    raise ValueError('Non supported type: ' + type(arr).__name__)
+
+
+def array2torch_tensor(self, arr: INPUT_DATA_ARRAY_TYPE) -> Tensor:
+    """
+    Convert ``arr`` (numpy array, pandas DataFrame/Series, list or torch Tensor) to a torch tensor.
+    Sets ``self.is_pandas = True`` on the owner object when ``arr`` is a pandas object.
+    """
+    if isinstance(arr, np.ndarray):
+        return torch.from_numpy(arr)
+    if isinstance(arr, (pd.DataFrame, pd.Series)):
+        self.is_pandas = True
+        return torch.from_numpy(arr.to_numpy())
+    if isinstance(arr, list):
+        return torch.tensor(arr)
+    if isinstance(arr, Tensor):
+        return arr
+    raise ValueError('Non supported type: ' + type(arr).__name__)
+
+
+class Dataset(metaclass=ABCMeta):
+    """Abstract base class for datasets; subclasses implement __init__, get_samples and get_labels."""
+
+    @abstractmethod
+    def __init__(self, **kwargs):
+        pass
+
+    @abstractmethod
+    def get_samples(self) -> Collection[Any]:
+        """Return the data samples held by the dataset."""
+        pass
+
+    @abstractmethod
+    def get_labels(self) -> Collection[Any]:
+        """Return the labels (the concrete datasets in this module return None when none were given)."""
+        pass
+
+
+class StoredDataset(Dataset):
+    """Abstract class for datasets that are loaded from storage, with download/extract/split helpers."""
+
+    @abstractmethod
+    def load_from_file(self, path: str):
+        """Load dataset from file"""
+        pass
+
+    @abstractmethod
+    def load(self, **kwargs):
+        """Load dataset"""
+        pass
+
+    @staticmethod
+    def download(url: str, dest_path: str, filename: str, unzip: bool = False) -> None:
+        """
+        Download the dataset from URL unless the target file already exists.
+        :param url: dataset URL, the dataset will be requested from this URL
+        :param dest_path: local dataset destination path (created if missing)
+        :param filename: local dataset filename
+        :param unzip: whether to extract the downloaded (or already present) archive into dest_path
+        :return: None
+        """
+        file_path = os.path.join(dest_path, filename)
+
+        if os.path.exists(file_path):
+            logger.warning("Files already downloaded, skipping downloading")
+
+        else:
+            os.makedirs(dest_path, exist_ok=True)
+            logger.info("Downloading the dataset...")
+            urllib.request.urlretrieve(url, file_path)
+            logger.info('Dataset Downloaded')
+
+        if unzip:
+            StoredDataset.extract_archive(zip_path=file_path, dest_path=dest_path, remove_archive=False)
+
+    @staticmethod
+    def extract_archive(zip_path: str, dest_path=None, remove_archive=False):
+        """
+        Extract dataset from archived file
+        :param zip_path: path to the archive; it is opened with tarfile, so it must be a tar archive
+        :param dest_path: directory path to uncompress the file to
+        :param remove_archive: whether remove the archive file after uncompress (default False)
+        :return: None
+        """
+        logger.info("Extracting the dataset...")
+        # NOTE(security): extractall trusts member paths - only extract archives from trusted sources.
+        with tarfile.open(zip_path) as tar:  # context manager closes the archive even on error
+            tar.extractall(path=dest_path)
+        logger.info("Dataset was extracted to {}".format(dest_path))
+        if remove_archive:
+            logger.info("Removing a zip file")
+            os.remove(zip_path)
+        logger.info("Extracted the dataset")
+
+    @staticmethod
+    def split_debug(datafile: str, dest_datafile: str, ratio: float, shuffle=True, delimiter=",", fmt=None) -> None:
+        """
+        Split the data and take only a part of it
+        :param datafile: dataset file path
+        :param dest_datafile: destination path for the partial dataset file
+        :param ratio: fraction of the rows to save (the first ``int(len(data) * ratio)`` rows are kept)
+        :param shuffle: whether to shuffle the data or not (default True)
+        :param delimiter: dataset delimiter (default ",")
+        :param fmt: format passed to numpy.savetxt; None falls back to numpy's default '%.18e'
+        :return: None
+        """
+        if os.path.isfile(dest_datafile):
+            logger.info(f"The partial debug split already exists {dest_datafile}")
+            return
+        # A bare file name has an empty dirname, which os.makedirs cannot create; fall back to '.'.
+        os.makedirs(os.path.dirname(dest_datafile) or '.', exist_ok=True)
+
+        data = np.genfromtxt(datafile, delimiter=delimiter)
+        if shuffle:
+            logger.info("Shuffling data")
+            np.random.shuffle(data)
+
+        debug_data = data[:int(len(data) * ratio)]
+        logger.info(f"Saving {ratio} of the data to {dest_datafile}")
+        np.savetxt(dest_datafile, debug_data, delimiter=delimiter, fmt='%.18e' if fmt is None else fmt)
+
+
+class ArrayDataset(Dataset):
+    """Dataset that is based on x and y arrays (e.g., numpy/pandas/list...)"""
+
+    def __init__(self, x: INPUT_DATA_ARRAY_TYPE, y: Optional[INPUT_DATA_ARRAY_TYPE] = None,
+                 features_names: Optional = None, **kwargs):
+        """
+        ArrayDataset constructor.
+        :param x: collection of data samples
+        :param y: collection of labels (optional)
+        :param features_names: list of str, The feature names, in the order that they appear in the data (optional)
+        :param kwargs: dataset parameters
+        """
+        self.is_pandas = False
+        self.features_names = features_names
+        self._y = array2numpy(self, y) if y is not None else None
+        self._x = array2numpy(self, x)
+        if isinstance(x, pd.DataFrame):  # is_pandas alone may come from a pandas y with a non-DataFrame x
+            if features_names is not None and len(features_names) and not np.array_equal(features_names, x.columns):
+                raise ValueError("The supplied features are not the same as in the data features")
+            self.features_names = x.columns.to_list()
+
+        if y is not None and len(self._x) != len(self._y):
+            raise ValueError('Non equivalent lengths of x and y')
+
+    def get_samples(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """Return data samples as numpy array"""
+        return self._x
+
+    def get_labels(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """Return labels as numpy array, or None when no labels were supplied"""
+        return self._y
+
+
+class PytorchData(Dataset):
+    """Dataset that stores x and y as torch tensors and supports indexing and len()."""
+
+    def __init__(self, x: INPUT_DATA_ARRAY_TYPE, y: Optional[INPUT_DATA_ARRAY_TYPE] = None, **kwargs):
+        """
+        PytorchData constructor.
+        :param x: collection of data samples
+        :param y: collection of labels (optional)
+        :param kwargs: dataset parameters
+        """
+        self.is_pandas = False
+        self._y = array2torch_tensor(self, y) if y is not None else None
+        self._x = array2torch_tensor(self, x)
+        # Only a DataFrame x has columns (is_pandas may also be set by a pandas y).
+        self.features_names = x.columns if isinstance(x, pd.DataFrame) else None
+
+        if y is not None and len(self._x) != len(self._y):
+            raise ValueError('Non equivalent lengths of x and y')
+
+    def __getitem__(self, idx):
+        """Return (sample, label) when labels exist, otherwise just the sample."""
+        # Must live on the class: Python ignores a __getitem__ assigned on the instance for obj[idx].
+        return self.get_item(idx) if self._y is not None else self.get_sample_item(idx)
+
+    def get_samples(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """Return data samples as numpy array"""
+        return array2numpy(self, self._x)
+
+    def get_labels(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """Return labels as numpy array, or None when no labels were supplied"""
+        return array2numpy(self, self._y) if self._y is not None else None
+
+    def get_sample_item(self, idx) -> Tensor:
+        """Return the sample tensor at ``idx``."""
+        return self._x[idx]
+
+    def get_item(self, idx) -> tuple:
+        """Return the (sample, label) pair at ``idx``."""
+        return self._x[idx], self._y[idx]
+
+    def __len__(self):
+        return len(self._x)
+
+
+class DatasetFactory:
+    """Registry-backed factory that creates dataset instances by name."""
+    registry = {}
+
+    @classmethod
+    def register(cls, name: str) -> Callable:
+        """
+        Build a class decorator that stores the decorated Dataset class in the registry.
+        :param name: key under which the dataset class is registered
+        :return: the decorator; it returns the decorated class unchanged
+        """
+
+        def decorator(dataset_cls: Dataset) -> Any:
+            already_registered = name in cls.registry
+            if already_registered:
+                logger.warning('Dataset %s already exists. Will replace it', name)
+            cls.registry[name] = dataset_cls
+            return dataset_cls
+
+        return decorator
+
+    @classmethod
+    def create_dataset(cls, name: str, **kwargs) -> Dataset:
+        """
+        Instantiate the dataset class registered under ``name``.
+        The class is looked up in the registry and called with ``kwargs``;
+        an unknown name is logged as an error and raises ValueError.
+        :param name: The name of the dataset to create.
+        :param kwargs: parameters forwarded to the dataset constructor
+        :return: the newly created dataset instance
+        """
+        if name in cls.registry:
+            # Known name: build the dataset straight from the registered class.
+            return cls.registry[name](**kwargs)
+
+        # Unknown name: log it and fail with the same message.
+        error_text = f'Dataset {name} does not exist in the registry'
+        logger.error(error_text)
+        raise ValueError(error_text)
+
+
+class Data:
+    def __init__(self, train: Dataset = None, test: Dataset = None, **kwargs):
+        """
+        Data class constructor.
+        The class stores train and test datasets.
+        If neither dataset is provided, both are created through
+        DatasetFactory.create_dataset, which receives ``kwargs``
+        plus ``train=True`` / ``train=False`` respectively.
+        """
+        if train is not None or test is not None:  # identity test: bool() would call a dataset's __len__
+            self.train = train
+            self.test = test
+        else:
+            self.train = DatasetFactory.create_dataset(train=True, **kwargs)
+            self.test = DatasetFactory.create_dataset(train=False, **kwargs)
+
+    def get_train_set(self) -> Dataset:
+        """Return the train Dataset"""
+        return self.train
+
+    def get_test_set(self) -> Dataset:
+        """Return the test Dataset"""
+        return self.test
+
+    def get_train_samples(self) -> Collection[Any]:
+        """Return train set samples"""
+        return self.train.get_samples()
+
+    def get_train_labels(self) -> Collection[Any]:
+        """Return train set labels"""
+        return self.train.get_labels()
+
+    def get_test_samples(self) -> Collection[Any]:
+        """Return test set samples"""
+        return self.test.get_samples()
+
+    def get_test_labels(self) -> Collection[Any]:
+        """Return test set labels"""
+        return self.test.get_labels()
diff --git a/apt/utils/models/__init__.py b/apt/utils/models/__init__.py
new file mode 100644
index 0000000..11efd5f
--- /dev/null
+++ b/apt/utils/models/__init__.py
@@ -0,0 +1,2 @@
+from apt.utils.models.model import Model, ModelOutputType
+from apt.utils.models.sklearn_model import SklearnModel, SklearnClassifier, SklearnRegressor
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
new file mode 100644
index 0000000..9616459
--- /dev/null
+++ b/apt/utils/models/model.py
@@ -0,0 +1,109 @@
+from abc import ABCMeta, abstractmethod
+from typing import Any, Optional
+from enum import Enum, auto
+
+from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
+
+
+class ModelOutputType(Enum):
+    CLASSIFIER_VECTOR = 1  # classifier yields probabilities or logits
+    CLASSIFIER_SCALAR = 2  # classifier yields the label only
+    REGRESSOR_SCALAR = 3  # regressor yields a value
+
+
+class Model(metaclass=ABCMeta):
+    """
+    Abstract base class for ML model wrappers.
+    """
+
+    def __init__(self, model: Any, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
+                 unlimited_queries: Optional[bool] = True, **kwargs):
+        """
+        Initialize a `Model` wrapper object.
+
+        :param model: The original model object (of the underlying ML framework)
+        :param output_type: The type of output the model yields (vector/label only for classifiers,
+                            value for regressors)
+        :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                                 Set to True if the model is only available via query (API) access, i.e.,
+                                 only the outputs of the model are exposed, and False if the model internals
+                                 are also available. Optional, Default is True.
+        :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                                  unlimited queries to the model API or whether there is a limit to the number of
+                                  queries that can be submitted. Optional, Default is True.
+        """
+        self._model = model
+        self._output_type = output_type
+        self._black_box_access = black_box_access
+        self._unlimited_queries = unlimited_queries
+
+    @abstractmethod
+    def fit(self, train_data: Dataset, **kwargs) -> None:
+        """
+        Fit the model using the training data.
+
+        :param train_data: Training data.
+        :type train_data: `Dataset`
+        """
+        raise NotImplementedError
+
+    @abstractmethod
+    def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Perform predictions using the model for input `x`.
+
+        :param x: Input samples.
+        :type x: `np.ndarray` or `pandas.DataFrame`
+        :return: Predictions from the model.
+        """
+        raise NotImplementedError
+
+    @abstractmethod
+    def score(self, test_data: Dataset, **kwargs):
+        """
+        Score the model using test data.
+
+        :param test_data: Test data.
+        :type test_data: `Dataset`
+        """
+        raise NotImplementedError
+
+    @property
+    def model(self) -> Any:
+        """
+        Return the model.
+
+        :return: The model.
+        """
+        return self._model
+
+    @property
+    def output_type(self) -> ModelOutputType:
+        """
+        Return the model's output type.
+
+        :return: The model's output type.
+        """
+        return self._output_type
+
+    @property
+    def black_box_access(self) -> bool:
+        """
+        Return True if the model is only available via query (API) access, i.e.,
+        only the outputs of the model are exposed, and False if the model internals are also available.
+
+        :return: True if the model is only available via query (API) access, i.e.,
+                 only the outputs of the model are exposed, and False if the model internals are also available.
+        """
+        return self._black_box_access
+
+    @property
+    def unlimited_queries(self) -> bool:
+        """
+        If black_box_access is True, Return whether a user can perform unlimited queries to the model API
+        or whether there is a limit to the number of queries that can be submitted.
+
+        :return: If black_box_access is True, Return whether a user can perform unlimited queries to the model API
+                 or whether there is a limit to the number of queries that can be submitted.
+        """
+        return self._unlimited_queries
diff --git a/apt/utils/models/sklearn_model.py b/apt/utils/models/sklearn_model.py
new file mode 100644
index 0000000..f7afaa6
--- /dev/null
+++ b/apt/utils/models/sklearn_model.py
@@ -0,0 +1,112 @@
+from typing import Optional
+
+import numpy as np
+
+from sklearn.preprocessing import OneHotEncoder
+from sklearn.base import BaseEstimator
+
+from apt.utils.models import Model, ModelOutputType
+from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
+
+from art.estimators.classification.scikitlearn import SklearnClassifier as ArtSklearnClassifier
+from art.estimators.regression.scikitlearn import ScikitlearnRegressor
+
+
+class SklearnModel(Model):
+    """
+    Wrapper class for scikitlearn models.
+    """
+    def score(self, test_data: Dataset, **kwargs):
+        """
+        Score the wrapped model on `test_data` (a `Dataset`) using the model's own `score` method.
+
+        :return: Whatever the underlying model's `score` returns for the test samples and labels.
+        """
+        samples, labels = test_data.get_samples(), test_data.get_labels()
+        return self.model.score(samples, labels, **kwargs)
+
+
+class SklearnClassifier(SklearnModel):
+    """
+    Wrapper class for scikitlearn classification models.
+    """
+    def __init__(self, model: BaseEstimator, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
+                 unlimited_queries: Optional[bool] = True, **kwargs):
+        """
+        Initialize a `SklearnClassifier` wrapper object.
+
+        :param model: The original sklearn model object.
+        :param output_type: The type of output the model yields (vector/label only for classifiers,
+                            value for regressors)
+        :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                                 Set to True if the model is only available via query (API) access, i.e.,
+                                 only the outputs of the model are exposed, and False if the model internals
+                                 are also available. Optional, Default is True.
+        :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                                  unlimited queries to the model API or whether there is a limit to the number of
+                                  queries that can be submitted. Optional, Default is True.
+        """
+        super().__init__(model, output_type, black_box_access, unlimited_queries, **kwargs)
+        self._art_model = ArtSklearnClassifier(model)
+
+    def fit(self, train_data: Dataset, **kwargs) -> None:
+        """
+        Fit the model using the training data.
+
+        :param train_data: Training data.
+        :type train_data: `Dataset`
+        """
+        encoder = OneHotEncoder(sparse=False)  # labels are one-hot encoded before being handed to the ART wrapper
+        y_encoded = encoder.fit_transform(train_data.get_labels().reshape(-1, 1))
+        self._art_model.fit(train_data.get_samples(), y_encoded, **kwargs)
+
+    def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Perform predictions using the model for input `x`.
+
+        :param x: Input samples, either wrapped in a `Dataset` or as a raw `np.ndarray`/`pandas.DataFrame`.
+        :return: Predictions from the model (class probabilities, if supported).
+        """
+        samples = x.get_samples() if isinstance(x, Dataset) else x  # ART expects raw array data
+        return self._art_model.predict(samples, **kwargs)
+
+
+class SklearnRegressor(SklearnModel):
+    """
+    Wrapper class for scikitlearn regression models.
+    """
+    def __init__(self, model: BaseEstimator, black_box_access: Optional[bool] = True,
+                 unlimited_queries: Optional[bool] = True, **kwargs):
+        """
+        Initialize a `SklearnRegressor` wrapper object.
+
+        :param model: The original sklearn model object.
+        :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                                 Set to True if the model is only available via query (API) access, i.e.,
+                                 only the outputs of the model are exposed, and False if the model internals
+                                 are also available. Optional, Default is True.
+        :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                                  unlimited queries to the model API or whether there is a limit to the number of
+                                  queries that can be submitted. Optional, Default is True.
+        """
+        super().__init__(model, ModelOutputType.REGRESSOR_SCALAR, black_box_access, unlimited_queries, **kwargs)
+        self._art_model = ScikitlearnRegressor(model)
+
+    def fit(self, train_data: Dataset, **kwargs) -> None:
+        """
+        Fit the model using the training data.
+
+        :param train_data: Training data.
+        :type train_data: `Dataset`
+        """
+        self._art_model.fit(train_data.get_samples(), train_data.get_labels(), **kwargs)
+
+    def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Perform predictions using the model for input `x`.
+
+        :param x: Input samples, either wrapped in a `Dataset` or as a raw `np.ndarray`/`pandas.DataFrame`.
+        :return: Predictions from the model.
+        """
+        samples = x.get_samples() if isinstance(x, Dataset) else x  # ART expects raw array data
+        return self._art_model.predict(samples, **kwargs)
diff --git a/notebooks/attribute_inference_anonymization_nursery.ipynb b/notebooks/attribute_inference_anonymization_nursery.ipynb
index 9952885..bfba540 100644
--- a/notebooks/attribute_inference_anonymization_nursery.ipynb
+++ b/notebooks/attribute_inference_anonymization_nursery.ipynb
@@ -29,198 +29,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 61,
+   "execution_count": 1,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>parents</th>\n",
-       "      <th>has_nurs</th>\n",
-       "      <th>form</th>\n",
-       "      <th>children</th>\n",
-       "      <th>housing</th>\n",
-       "      <th>finance</th>\n",
-       "      <th>social</th>\n",
-       "      <th>health</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>8450</th>\n",
-       "      <td>pretentious</td>\n",
-       "      <td>very_crit</td>\n",
-       "      <td>foster</td>\n",
-       "      <td>1</td>\n",
-       "      <td>less_conv</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>1</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12147</th>\n",
-       "      <td>great_pret</td>\n",
-       "      <td>very_crit</td>\n",
-       "      <td>complete</td>\n",
-       "      <td>1</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>inconv</td>\n",
-       "      <td>1</td>\n",
-       "      <td>recommended</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2780</th>\n",
-       "      <td>usual</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>complete</td>\n",
-       "      <td>4</td>\n",
-       "      <td>less_conv</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>1</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11924</th>\n",
-       "      <td>great_pret</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>foster</td>\n",
-       "      <td>1</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>1</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>59</th>\n",
-       "      <td>usual</td>\n",
-       "      <td>proper</td>\n",
-       "      <td>complete</td>\n",
-       "      <td>2</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>0</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>...</th>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5193</th>\n",
-       "      <td>pretentious</td>\n",
-       "      <td>less_proper</td>\n",
-       "      <td>complete</td>\n",
-       "      <td>1</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>inconv</td>\n",
-       "      <td>0</td>\n",
-       "      <td>recommended</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1375</th>\n",
-       "      <td>usual</td>\n",
-       "      <td>less_proper</td>\n",
-       "      <td>incomplete</td>\n",
-       "      <td>2</td>\n",
-       "      <td>less_conv</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>1</td>\n",
-       "      <td>priority</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10318</th>\n",
-       "      <td>great_pret</td>\n",
-       "      <td>less_proper</td>\n",
-       "      <td>foster</td>\n",
-       "      <td>4</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>0</td>\n",
-       "      <td>priority</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6396</th>\n",
-       "      <td>pretentious</td>\n",
-       "      <td>improper</td>\n",
-       "      <td>completed</td>\n",
-       "      <td>3</td>\n",
-       "      <td>less_conv</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>1</td>\n",
-       "      <td>recommended</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>485</th>\n",
-       "      <td>usual</td>\n",
-       "      <td>proper</td>\n",
-       "      <td>incomplete</td>\n",
-       "      <td>1</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>inconv</td>\n",
-       "      <td>1</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "<p>10366 rows × 8 columns</p>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "           parents     has_nurs        form children     housing     finance  \\\n",
-       "8450   pretentious    very_crit      foster        1   less_conv  convenient   \n",
-       "12147   great_pret    very_crit    complete        1    critical      inconv   \n",
-       "2780         usual     critical    complete        4   less_conv  convenient   \n",
-       "11924   great_pret     critical      foster        1    critical  convenient   \n",
-       "59           usual       proper    complete        2  convenient  convenient   \n",
-       "...            ...          ...         ...      ...         ...         ...   \n",
-       "5193   pretentious  less_proper    complete        1  convenient      inconv   \n",
-       "1375         usual  less_proper  incomplete        2   less_conv  convenient   \n",
-       "10318   great_pret  less_proper      foster        4  convenient  convenient   \n",
-       "6396   pretentious     improper   completed        3   less_conv  convenient   \n",
-       "485          usual       proper  incomplete        1    critical      inconv   \n",
-       "\n",
-       "       social       health  \n",
-       "8450        1    not_recom  \n",
-       "12147       1  recommended  \n",
-       "2780        1    not_recom  \n",
-       "11924       1    not_recom  \n",
-       "59          0    not_recom  \n",
-       "...       ...          ...  \n",
-       "5193        0  recommended  \n",
-       "1375        1     priority  \n",
-       "10318       0     priority  \n",
-       "6396        1  recommended  \n",
-       "485         1    not_recom  \n",
-       "\n",
-       "[10366 rows x 8 columns]"
-      ]
+      "text/plain": "           parents     has_nurs        form children     housing     finance  \\\n8450   pretentious    very_crit      foster        1   less_conv  convenient   \n12147   great_pret    very_crit    complete        1    critical      inconv   \n2780         usual     critical    complete        4   less_conv  convenient   \n11924   great_pret     critical      foster        1    critical  convenient   \n59           usual       proper    complete        2  convenient  convenient   \n...            ...          ...         ...      ...         ...         ...   \n5193   pretentious  less_proper    complete        1  convenient      inconv   \n1375         usual  less_proper  incomplete        2   less_conv  convenient   \n10318   great_pret  less_proper      foster        4  convenient  convenient   \n6396   pretentious     improper   completed        3   less_conv  convenient   \n485          usual       proper  incomplete        1    critical      inconv   \n\n       social       health  \n8450        1    not_recom  \n12147       1  recommended  \n2780        1    not_recom  \n11924       1    not_recom  \n59          0    not_recom  \n...       ...          ...  \n5193        0  recommended  \n1375        1     priority  \n10318       0     priority  \n6396        1  recommended  \n485         1    not_recom  \n\n[10366 rows x 8 columns]",
+      "text/html": "<div>\n<style scoped>\n    .dataframe tbody tr th:only-of-type {\n        vertical-align: middle;\n    }\n\n    .dataframe tbody tr th {\n        vertical-align: top;\n    }\n\n    .dataframe thead th {\n        text-align: right;\n    }\n</style>\n<table border=\"1\" class=\"dataframe\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>parents</th>\n      <th>has_nurs</th>\n      <th>form</th>\n      <th>children</th>\n      <th>housing</th>\n      <th>finance</th>\n      <th>social</th>\n      <th>health</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>8450</th>\n      <td>pretentious</td>\n      <td>very_crit</td>\n      <td>foster</td>\n      <td>1</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>12147</th>\n      <td>great_pret</td>\n      <td>very_crit</td>\n      <td>complete</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>inconv</td>\n      <td>1</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>2780</th>\n      <td>usual</td>\n      <td>critical</td>\n      <td>complete</td>\n      <td>4</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>11924</th>\n      <td>great_pret</td>\n      <td>critical</td>\n      <td>foster</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>59</th>\n      <td>usual</td>\n      <td>proper</td>\n      <td>complete</td>\n      <td>2</td>\n      <td>convenient</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>...</th>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n    </tr>\n    <tr>\n      <th>5193</th>\n      
<td>pretentious</td>\n      <td>less_proper</td>\n      <td>complete</td>\n      <td>1</td>\n      <td>convenient</td>\n      <td>inconv</td>\n      <td>0</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>1375</th>\n      <td>usual</td>\n      <td>less_proper</td>\n      <td>incomplete</td>\n      <td>2</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>priority</td>\n    </tr>\n    <tr>\n      <th>10318</th>\n      <td>great_pret</td>\n      <td>less_proper</td>\n      <td>foster</td>\n      <td>4</td>\n      <td>convenient</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>priority</td>\n    </tr>\n    <tr>\n      <th>6396</th>\n      <td>pretentious</td>\n      <td>improper</td>\n      <td>completed</td>\n      <td>3</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>485</th>\n      <td>usual</td>\n      <td>proper</td>\n      <td>incomplete</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>inconv</td>\n      <td>1</td>\n      <td>not_recom</td>\n    </tr>\n  </tbody>\n</table>\n<p>10366 rows × 8 columns</p>\n</div>"
      },
-     "execution_count": 61,
+     "execution_count": 1,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -230,7 +47,7 @@
     "import sys\n",
     "sys.path.insert(0, os.path.abspath('..'))\n",
     "\n",
-    "from apt.utils import get_nursery_dataset\n",
+    "from apt.utils.dataset_utils import get_nursery_dataset\n",
     "\n",
     "(x_train, y_train), (x_test, y_test) = get_nursery_dataset(transform_social=True)\n",
     "\n",
@@ -246,7 +63,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 62,
+   "execution_count": 2,
    "metadata": {},
    "outputs": [
     {
@@ -263,9 +80,9 @@
     "from sklearn.preprocessing import OneHotEncoder\n",
     "\n",
     "x_train_str = x_train.astype(str)\n",
-    "train_encoded = OneHotEncoder(sparse=False, drop='if_binary').fit_transform(x_train_str)\n",
+    "train_encoded = OneHotEncoder(sparse=False).fit_transform(x_train_str)\n",
     "x_test_str = x_test.astype(str)\n",
-    "test_encoded = OneHotEncoder(sparse=False, drop='if_binary').fit_transform(x_test_str)\n",
+    "test_encoded = OneHotEncoder(sparse=False).fit_transform(x_test_str)\n",
     "    \n",
     "model = DecisionTreeClassifier()\n",
     "model.fit(train_encoded, y_train)\n",
@@ -287,7 +104,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 91,
+   "execution_count": 3,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -323,14 +140,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 96,
+   "execution_count": 4,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.6430638626278217\n"
+      "1.0\n"
      ]
     }
    ],
@@ -361,14 +178,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 55,
+   "execution_count": 5,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.6980513216284006\n"
+      "0.5122515917422342\n"
      ]
     }
    ],
@@ -408,224 +225,43 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 97,
+   "execution_count": 6,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>parents</th>\n",
-       "      <th>has_nurs</th>\n",
-       "      <th>form</th>\n",
-       "      <th>children</th>\n",
-       "      <th>housing</th>\n",
-       "      <th>finance</th>\n",
-       "      <th>social</th>\n",
-       "      <th>health</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>8450</th>\n",
-       "      <td>pretentious</td>\n",
-       "      <td>very_crit</td>\n",
-       "      <td>foster</td>\n",
-       "      <td>1</td>\n",
-       "      <td>less_conv</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>0</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12147</th>\n",
-       "      <td>great_pret</td>\n",
-       "      <td>very_crit</td>\n",
-       "      <td>complete</td>\n",
-       "      <td>1</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>inconv</td>\n",
-       "      <td>1</td>\n",
-       "      <td>recommended</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2780</th>\n",
-       "      <td>usual</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>complete</td>\n",
-       "      <td>4</td>\n",
-       "      <td>less_conv</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>0</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11924</th>\n",
-       "      <td>great_pret</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>foster</td>\n",
-       "      <td>1</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>0</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>59</th>\n",
-       "      <td>usual</td>\n",
-       "      <td>proper</td>\n",
-       "      <td>complete</td>\n",
-       "      <td>2</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>0</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>...</th>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "      <td>...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5193</th>\n",
-       "      <td>pretentious</td>\n",
-       "      <td>less_proper</td>\n",
-       "      <td>complete</td>\n",
-       "      <td>1</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>inconv</td>\n",
-       "      <td>0</td>\n",
-       "      <td>recommended</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1375</th>\n",
-       "      <td>usual</td>\n",
-       "      <td>less_proper</td>\n",
-       "      <td>incomplete</td>\n",
-       "      <td>2</td>\n",
-       "      <td>less_conv</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>1</td>\n",
-       "      <td>priority</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10318</th>\n",
-       "      <td>great_pret</td>\n",
-       "      <td>less_proper</td>\n",
-       "      <td>foster</td>\n",
-       "      <td>4</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>0</td>\n",
-       "      <td>priority</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6396</th>\n",
-       "      <td>pretentious</td>\n",
-       "      <td>improper</td>\n",
-       "      <td>completed</td>\n",
-       "      <td>3</td>\n",
-       "      <td>less_conv</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>1</td>\n",
-       "      <td>recommended</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>485</th>\n",
-       "      <td>usual</td>\n",
-       "      <td>proper</td>\n",
-       "      <td>incomplete</td>\n",
-       "      <td>1</td>\n",
-       "      <td>critical</td>\n",
-       "      <td>convenient</td>\n",
-       "      <td>0</td>\n",
-       "      <td>not_recom</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "<p>10366 rows × 8 columns</p>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "           parents     has_nurs        form children     housing     finance  \\\n",
-       "8450   pretentious    very_crit      foster        1   less_conv  convenient   \n",
-       "12147   great_pret    very_crit    complete        1    critical      inconv   \n",
-       "2780         usual     critical    complete        4   less_conv  convenient   \n",
-       "11924   great_pret     critical      foster        1    critical  convenient   \n",
-       "59           usual       proper    complete        2  convenient  convenient   \n",
-       "...            ...          ...         ...      ...         ...         ...   \n",
-       "5193   pretentious  less_proper    complete        1  convenient      inconv   \n",
-       "1375         usual  less_proper  incomplete        2   less_conv  convenient   \n",
-       "10318   great_pret  less_proper      foster        4  convenient  convenient   \n",
-       "6396   pretentious     improper   completed        3   less_conv  convenient   \n",
-       "485          usual       proper  incomplete        1    critical  convenient   \n",
-       "\n",
-       "       social       health  \n",
-       "8450        0    not_recom  \n",
-       "12147       1  recommended  \n",
-       "2780        0    not_recom  \n",
-       "11924       0    not_recom  \n",
-       "59          0    not_recom  \n",
-       "...       ...          ...  \n",
-       "5193        0  recommended  \n",
-       "1375        1     priority  \n",
-       "10318       0     priority  \n",
-       "6396        1  recommended  \n",
-       "485         0    not_recom  \n",
-       "\n",
-       "[10366 rows x 8 columns]"
-      ]
+      "text/plain": "           parents     has_nurs        form children     housing     finance  \\\n0      pretentious    very_crit      foster        1   less_conv  convenient   \n1       great_pret    very_crit    complete        1    critical      inconv   \n2            usual     critical    complete        4   less_conv  convenient   \n3       great_pret     critical      foster        1    critical  convenient   \n4            usual       proper    complete        2  convenient  convenient   \n...            ...          ...         ...      ...         ...         ...   \n10361  pretentious  less_proper    complete        1  convenient      inconv   \n10362        usual  less_proper  incomplete        2   less_conv  convenient   \n10363   great_pret  less_proper      foster        4  convenient  convenient   \n10364  pretentious     improper   completed        3   less_conv  convenient   \n10365        usual       proper  incomplete        1    critical  convenient   \n\n      social       health  \n0          0    not_recom  \n1          1  recommended  \n2          0    not_recom  \n3          0    not_recom  \n4          0    not_recom  \n...      ...          ...  \n10361      0  recommended  \n10362      1     priority  \n10363      0     priority  \n10364      1  recommended  \n10365      0    not_recom  \n\n[10366 rows x 8 columns]",
+      "text/html": "<div>\n<style scoped>\n    .dataframe tbody tr th:only-of-type {\n        vertical-align: middle;\n    }\n\n    .dataframe tbody tr th {\n        vertical-align: top;\n    }\n\n    .dataframe thead th {\n        text-align: right;\n    }\n</style>\n<table border=\"1\" class=\"dataframe\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>parents</th>\n      <th>has_nurs</th>\n      <th>form</th>\n      <th>children</th>\n      <th>housing</th>\n      <th>finance</th>\n      <th>social</th>\n      <th>health</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>0</th>\n      <td>pretentious</td>\n      <td>very_crit</td>\n      <td>foster</td>\n      <td>1</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>1</th>\n      <td>great_pret</td>\n      <td>very_crit</td>\n      <td>complete</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>inconv</td>\n      <td>1</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>2</th>\n      <td>usual</td>\n      <td>critical</td>\n      <td>complete</td>\n      <td>4</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>3</th>\n      <td>great_pret</td>\n      <td>critical</td>\n      <td>foster</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>4</th>\n      <td>usual</td>\n      <td>proper</td>\n      <td>complete</td>\n      <td>2</td>\n      <td>convenient</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>...</th>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n    </tr>\n    <tr>\n      <th>10361</th>\n      
<td>pretentious</td>\n      <td>less_proper</td>\n      <td>complete</td>\n      <td>1</td>\n      <td>convenient</td>\n      <td>inconv</td>\n      <td>0</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>10362</th>\n      <td>usual</td>\n      <td>less_proper</td>\n      <td>incomplete</td>\n      <td>2</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>priority</td>\n    </tr>\n    <tr>\n      <th>10363</th>\n      <td>great_pret</td>\n      <td>less_proper</td>\n      <td>foster</td>\n      <td>4</td>\n      <td>convenient</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>priority</td>\n    </tr>\n    <tr>\n      <th>10364</th>\n      <td>pretentious</td>\n      <td>improper</td>\n      <td>completed</td>\n      <td>3</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>10365</th>\n      <td>usual</td>\n      <td>proper</td>\n      <td>incomplete</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n  </tbody>\n</table>\n<p>10366 rows × 8 columns</p>\n</div>"
      },
-     "execution_count": 97,
+     "execution_count": 6,
      "metadata": {},
      "output_type": "execute_result"
     }
    ],
    "source": [
+    "from apt.utils.datasets import ArrayDataset\n",
     "from apt.anonymization import Anonymize\n",
     "\n",
+    "features = x_train.columns\n",
     "QI = [\"finance\", \"social\", \"health\"]\n",
     "categorical_features = [\"parents\", \"has_nurs\", \"form\", \"housing\", \"finance\", \"health\", 'children']\n",
-    "anonymizer = Anonymize(100, QI, categorical_features=categorical_features)\n",
-    "anon = anonymizer.anonymize(x_train, x_train_predictions)\n",
-    "anon"
+    "QI_indexes = [i for i, v in enumerate(features) if v in QI]\n",
+    "categorical_features_indexes = [i for i, v in enumerate(features) if v in categorical_features]\n",
+    "anonymizer = Anonymize(100, QI_indexes, categorical_features=categorical_features_indexes)\n",
+    "anon = anonymizer.anonymize(ArrayDataset(x_train, x_train_predictions))\n",
+    "anon\n"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 64,
+   "execution_count": 7,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": [
-       "7585"
-      ]
+      "text/plain": "7585"
      },
-     "execution_count": 64,
+     "execution_count": 7,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -637,16 +273,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 65,
+   "execution_count": 8,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": [
-       "5766"
-      ]
+      "text/plain": "5766"
      },
-     "execution_count": 65,
+     "execution_count": 8,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -665,7 +299,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 66,
+   "execution_count": 9,
    "metadata": {},
    "outputs": [
     {
@@ -678,7 +312,7 @@
    ],
    "source": [
     "anon_str = anon.astype(str)\n",
-    "anon_encoded = OneHotEncoder(sparse=False, drop='if_binary').fit_transform(anon_str)\n",
+    "anon_encoded = OneHotEncoder(sparse=False).fit_transform(anon_str)\n",
     "\n",
     "anon_model = DecisionTreeClassifier()\n",
     "anon_model.fit(anon_encoded, y_train)\n",
@@ -698,14 +332,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 98,
+   "execution_count": 10,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.6471155701331275\n"
+      "1.0\n"
      ]
     }
    ],
@@ -734,14 +368,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 69,
+   "execution_count": 11,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.6982442600810341\n"
+      "0.5245996527107852\n"
      ]
     }
    ],
@@ -765,15 +399,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 87,
+   "execution_count": 12,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(0.33056202194878614, 0.2888695146759663)\n",
-      "(0.34112301200908796, 0.3054344667247893)\n"
+      "(0.49415432579890883, 0.48976438779451525)\n",
+      "(0.49415432579890883, 0.48976438779451525)\n"
      ]
     }
    ],
@@ -810,15 +444,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 88,
+   "execution_count": 13,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(0.6457357075913777, 0.2002324905550712)\n",
-      "(0.6472248353715898, 0.1999418773612322)\n"
+      "(1.0, 0.019204655674102813)\n",
+      "(0.9829787234042553, 0.04481086323957323)\n"
      ]
     }
    ],
@@ -849,26 +483,24 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 74,
+   "execution_count": 14,
    "metadata": {},
    "outputs": [],
    "source": [
-    "anonymizer2 = Anonymize(1000, QI, categorical_features=categorical_features)\n",
-    "anon2 = anonymizer2.anonymize(x_train, x_train_predictions)"
+    "anonymizer2 = Anonymize(1000, QI_indexes, categorical_features=categorical_features_indexes)\n",
+    "anon2 = anonymizer2.anonymize(ArrayDataset(x_train, x_train_predictions))"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 75,
+   "execution_count": 15,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": [
-       "4226"
-      ]
+      "text/plain": "4226"
      },
-     "execution_count": 75,
+     "execution_count": 15,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -887,7 +519,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 104,
+   "execution_count": 16,
    "metadata": {},
    "outputs": [
     {
@@ -900,7 +532,7 @@
    ],
    "source": [
     "anon2_str = anon2.astype(str)\n",
-    "anon2_encoded = OneHotEncoder(sparse=False, drop='if_binary').fit_transform(anon2_str)\n",
+    "anon2_encoded = OneHotEncoder(sparse=False).fit_transform(anon2_str)\n",
     "\n",
     "anon2_model = DecisionTreeClassifier()\n",
     "anon2_model.fit(anon2_encoded, y_train)\n",
@@ -920,14 +552,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 105,
+   "execution_count": 17,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.6266640941539648\n"
+      "1.0\n"
      ]
     }
    ],
@@ -956,14 +588,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 106,
+   "execution_count": 18,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.6944819602546788\n"
+      "0.515820953115956\n"
      ]
     }
    ],
@@ -980,17 +612,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 107,
+   "execution_count": 19,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(0.35793357933579334, 0.17037470725995316)\n",
-      "(0.3360655737704918, 0.1680327868852459)\n",
-      "(0.6457357075913777, 0.2002324905550712)\n",
-      "(0.6327519379844961, 0.1897704155768672)\n"
+      "(0.49415432579890883, 0.48976438779451525)\n",
+      "(0.49415432579890883, 0.48976438779451525)\n",
+      "(1.0, 0.019204655674102813)\n",
+      "(1.0, 0.026382153249272552)\n"
      ]
     }
    ],
@@ -1023,27 +655,26 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 111,
+   "execution_count": 20,
    "metadata": {},
    "outputs": [],
    "source": [
     "QI2 = [\"parents\", \"has_nurs\", \"form\", \"children\", \"housing\", \"finance\", \"social\", \"health\"]\n",
-    "anonymizer3 = Anonymize(100, QI2, categorical_features=categorical_features)\n",
-    "anon3 = anonymizer3.anonymize(x_train, x_train_predictions)"
+    "QI2_indexes = [i for i, v in enumerate(features) if v in QI2]\n",
+    "anonymizer3 = Anonymize(100, QI2_indexes, categorical_features=categorical_features_indexes)\n",
+    "anon3 = anonymizer3.anonymize(ArrayDataset(x_train, x_train_predictions))"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 112,
+   "execution_count": 21,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": [
-       "39"
-      ]
+      "text/plain": "39"
      },
-     "execution_count": 112,
+     "execution_count": 21,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -1055,22 +686,22 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 113,
+   "execution_count": 22,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Anonymized model accuracy:  0.7723765432098766\n",
-      "BB attack accuracy:  0.5792012348060969\n",
-      "WB attack accuracy:  0.6680493922438742\n"
+      "Anonymized model accuracy:  0.751929012345679\n",
+      "BB attack accuracy:  1.0\n",
+      "WB attack accuracy:  0.5187150299054601\n"
      ]
     }
    ],
    "source": [
     "anon3_str = anon3.astype(str)\n",
-    "anon3_encoded = OneHotEncoder(sparse=False, drop='if_binary').fit_transform(anon3_str)\n",
+    "anon3_encoded = OneHotEncoder(sparse=False).fit_transform(anon3_str)\n",
     "\n",
     "anon3_model = DecisionTreeClassifier()\n",
     "anon3_model.fit(anon3_encoded, y_train)\n",
@@ -1105,17 +736,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 114,
+   "execution_count": 23,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(0.35793357933579334, 0.17037470725995316)\n",
-      "(0.3393939393939394, 0.13114754098360656)\n",
-      "(0.6457357075913777, 0.2002324905550712)\n",
-      "(1, 0.0)\n"
+      "(0.49415432579890883, 0.48976438779451525)\n",
+      "(0.49415432579890883, 0.48976438779451525)\n",
+      "(1.0, 0.019204655674102813)\n",
+      "(1.0, 0.032201745877788554)\n"
      ]
     }
    ],
@@ -1162,4 +793,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 2
-}
+}
\ No newline at end of file
diff --git a/notebooks/membership_inference_anonymization_adult.ipynb b/notebooks/membership_inference_anonymization_adult.ipynb
index c2c7e74..4a0ea00 100644
--- a/notebooks/membership_inference_anonymization_adult.ipynb
+++ b/notebooks/membership_inference_anonymization_adult.ipynb
@@ -29,7 +29,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 97,
+   "execution_count": 6,
    "metadata": {},
    "outputs": [
     {
@@ -44,6 +44,18 @@
       " [  26.   11.    0.    0.   48.]\n",
       " [  27.    9.    0.    0.   40.]]\n"
      ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/var/folders/9b/qbtw28w53355cvpjs4qn83yc0000gn/T/ipykernel_85828/3975777015.py:22: DeprecationWarning: `np.int` is a deprecated alias for the builtin `int`. To silence this warning, use `int` by itself. Doing this will not modify any behavior and is safe. When replacing `np.int`, you may wish to use e.g. `np.int64` or `np.int32` to specify the precision. If you wish to review your current use, check the release note link for additional information.\n",
+      "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n",
+      "  y_train = y_train.astype(np.int)\n",
+      "/var/folders/9b/qbtw28w53355cvpjs4qn83yc0000gn/T/ipykernel_85828/3975777015.py:26: DeprecationWarning: `np.int` is a deprecated alias for the builtin `int`. To silence this warning, use `int` by itself. Doing this will not modify any behavior and is safe. When replacing `np.int`, you may wish to use e.g. `np.int64` or `np.int32` to specify the precision. If you wish to review your current use, check the release note link for additional information.\n",
+      "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n",
+      "  y_test = y_test.astype(np.int)\n"
+     ]
     }
    ],
    "source": [
@@ -90,14 +102,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 116,
+   "execution_count": 7,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Base model accuracy:  0.8075056814691972\n"
+      "Base model accuracy:  0.8074442601805786\n"
      ]
     }
    ],
@@ -126,9 +138,18 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 124,
+   "execution_count": 8,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/olasaadi/PycharmProjects/ai-privacy-toolkit-internal/venv/lib/python3.8/site-packages/art/attacks/inference/membership_inference/black_box.py:262: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples,), for example using ravel().\n",
+      "  self.attack_model.fit(np.c_[x_1, x_2], y_ready)  # type: ignore\n"
+     ]
+    }
+   ],
    "source": [
     "from art.attacks.inference.membership_inference import MembershipInferenceBlackBox\n",
     "\n",
@@ -154,14 +175,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 125,
+   "execution_count": 9,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.5440363591696352\n"
+      "0.545264709495148\n"
      ]
     }
    ],
@@ -197,7 +218,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 128,
+   "execution_count": 10,
    "metadata": {},
    "outputs": [
     {
@@ -215,6 +236,7 @@
     }
    ],
    "source": [
+    "from apt.utils.datasets import ArrayDataset\n",
     "import os\n",
     "import sys\n",
     "sys.path.insert(0, os.path.abspath('..'))\n",
@@ -223,22 +245,20 @@
     "# QI = (age, education-num, capital-gain, hours-per-week)\n",
     "QI = [0, 1, 2, 4]\n",
     "anonymizer = Anonymize(100, QI)\n",
-    "anon = anonymizer.anonymize(x_train, x_train_predictions)\n",
+    "anon = anonymizer.anonymize(ArrayDataset(x_train, x_train_predictions))\n",
     "print(anon)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 104,
+   "execution_count": 11,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": [
-       "6739"
-      ]
+      "text/plain": "6739"
      },
-     "execution_count": 104,
+     "execution_count": 11,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -250,16 +270,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 129,
+   "execution_count": 12,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": [
-       "658"
-      ]
+      "text/plain": "658"
      },
-     "execution_count": 129,
+     "execution_count": 12,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -278,14 +296,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 130,
+   "execution_count": 13,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Anonymized model accuracy:  0.8304158221239482\n"
+      "Anonymized model accuracy:  0.83078434985566\n"
      ]
     }
    ],
@@ -308,14 +326,22 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 131,
+   "execution_count": 14,
    "metadata": {},
    "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/olasaadi/PycharmProjects/ai-privacy-toolkit-internal/venv/lib/python3.8/site-packages/art/attacks/inference/membership_inference/black_box.py:262: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples,), for example using ravel().\n",
+      "  self.attack_model.fit(np.c_[x_1, x_2], y_ready)  # type: ignore\n"
+     ]
+    },
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.5034393809114359\n"
+      "0.5047291487532244\n"
      ]
     }
    ],
@@ -345,15 +371,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 132,
+   "execution_count": 15,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(0.5298924372550654, 0.7806166318634075)\n",
-      "(0.5030507735890172, 0.5671293452892765)\n"
+      "(0.5312420517168291, 0.7696843139663432)\n",
+      "(0.5048372911169745, 0.4935511607910576)\n"
      ]
     }
    ],
@@ -419,4 +445,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 2
-}
+}
\ No newline at end of file
diff --git a/notebooks/membership_inference_dp_diabetes_reg.ipynb b/notebooks/membership_inference_dp_diabetes_reg.ipynb
index 1376dc6..92922ab 100644
--- a/notebooks/membership_inference_dp_diabetes_reg.ipynb
+++ b/notebooks/membership_inference_dp_diabetes_reg.ipynb
@@ -29,7 +29,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 121,
+   "execution_count": 1,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -50,7 +50,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 122,
+   "execution_count": 2,
    "metadata": {},
    "outputs": [
     {
@@ -86,14 +86,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 123,
+   "execution_count": 3,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.4954954954954955\n"
+      "0.527027027027027\n"
      ]
     }
    ],
@@ -131,7 +131,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 124,
+   "execution_count": 4,
    "metadata": {},
    "outputs": [
     {
@@ -141,6 +141,22 @@
       "unique rows in original data:  221\n"
      ]
     },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/olasaadi/PycharmProjects/ai-privacy-toolkit-internal/venv/lib/python3.8/site-packages/art/attacks/inference/membership_inference/black_box.py:262: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples,), for example using ravel().\n",
+      "  self.attack_model.fit(np.c_[x_1, x_2], y_ready)  # type: ignore\n",
+      "/Users/olasaadi/PycharmProjects/ai-privacy-toolkit-internal/venv/lib/python3.8/site-packages/art/attacks/inference/membership_inference/black_box.py:262: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples,), for example using ravel().\n",
+      "  self.attack_model.fit(np.c_[x_1, x_2], y_ready)  # type: ignore\n",
+      "/Users/olasaadi/PycharmProjects/ai-privacy-toolkit-internal/venv/lib/python3.8/site-packages/art/attacks/inference/membership_inference/black_box.py:262: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples,), for example using ravel().\n",
+      "  self.attack_model.fit(np.c_[x_1, x_2], y_ready)  # type: ignore\n",
+      "/Users/olasaadi/PycharmProjects/ai-privacy-toolkit-internal/venv/lib/python3.8/site-packages/art/attacks/inference/membership_inference/black_box.py:262: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples,), for example using ravel().\n",
+      "  self.attack_model.fit(np.c_[x_1, x_2], y_ready)  # type: ignore\n",
+      "/Users/olasaadi/PycharmProjects/ai-privacy-toolkit-internal/venv/lib/python3.8/site-packages/art/attacks/inference/membership_inference/black_box.py:262: DataConversionWarning: A column-vector y was passed when a 1d array was expected. Please change the shape of y to (n_samples,), for example using ravel().\n",
+      "  self.attack_model.fit(np.c_[x_1, x_2], y_ready)  # type: ignore\n"
+     ]
+    },
     {
      "name": "stdout",
      "output_type": "stream",
@@ -148,11 +164,12 @@
       "k values:  [5, 10, 20, 50, 75]\n",
       "unique rows: [34, 19, 8, 4, 2]\n",
       "model accuracy: [0.43165832354998956, 0.4509641063206041, -1.730181929385853, -5.577098823982753e+27, -1.2751609045828272e+25]\n",
-      "attack accuracy: [0.5, 0.47297297297297297, 0.49549549549549543, 0.5, 0.47297297297297297]\n"
+      "attack accuracy: [0.509009009009009, 0.481981981981982, 0.509009009009009, 0.5045045045045045, 0.4954954954954955]\n"
      ]
     }
    ],
    "source": [
+    "from apt.utils.datasets import ArrayDataset\n",
     "from apt.anonymization import Anonymize\n",
     "k_values=[5, 10, 20, 50, 75]\n",
     "model_accuracy = []\n",
@@ -165,7 +182,7 @@
     "\n",
     "for k in k_values:\n",
     "    anonymizer = Anonymize(k, QI, is_regression=True)\n",
-    "    anon = anonymizer.anonymize(X_train, x_train_predictions)\n",
+    "    anon = anonymizer.anonymize(ArrayDataset(X_train, x_train_predictions))\n",
     "    unique_values.append(len(np.unique(anon, axis=0)))\n",
     "    \n",
     "    anon_model = LinearRegression()\n",
@@ -198,7 +215,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 124,
+   "execution_count": 4,
    "metadata": {},
    "outputs": [],
    "source": []
diff --git a/notebooks/minimization_adult.ipynb b/notebooks/minimization_adult.ipynb
index 17610a3..e8ccc20 100644
--- a/notebooks/minimization_adult.ipynb
+++ b/notebooks/minimization_adult.ipynb
@@ -27,7 +27,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 15,
    "metadata": {},
    "outputs": [
     {
@@ -42,6 +42,18 @@
       " [2.2000e+01 9.0000e+00 0.0000e+00 0.0000e+00 2.0000e+01]\n",
       " [5.2000e+01 9.0000e+00 1.5024e+04 0.0000e+00 4.0000e+01]]\n"
      ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/var/folders/9b/qbtw28w53355cvpjs4qn83yc0000gn/T/ipykernel_13726/1357868359.py:22: DeprecationWarning: `np.int` is a deprecated alias for the builtin `int`. To silence this warning, use `int` by itself. Doing this will not modify any behavior and is safe. When replacing `np.int`, you may wish to use e.g. `np.int64` or `np.int32` to specify the precision. If you wish to review your current use, check the release note link for additional information.\n",
+      "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n",
+      "  y_train = y_train.astype(np.int)\n",
+      "/var/folders/9b/qbtw28w53355cvpjs4qn83yc0000gn/T/ipykernel_13726/1357868359.py:26: DeprecationWarning: `np.int` is a deprecated alias for the builtin `int`. To silence this warning, use `int` by itself. Doing this will not modify any behavior and is safe. When replacing `np.int`, you may wish to use e.g. `np.int64` or `np.int32` to specify the precision. If you wish to review your current use, check the release note link for additional information.\n",
+      "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n",
+      "  y_test = y_test.astype(np.int)\n"
+     ]
     }
    ],
    "source": [
@@ -84,24 +96,27 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 16,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Base model accuracy:  0.8189914624408821\n"
+      "Base model accuracy:  0.8183158282660771\n"
      ]
     }
    ],
    "source": [
+    "from apt.utils.datasets import ArrayDataset\n",
+    "from apt.utils.models import SklearnClassifier, ModelOutputType\n",
     "from sklearn.tree import DecisionTreeClassifier\n",
     "\n",
-    "model = DecisionTreeClassifier()\n",
-    "model.fit(x_train, y_train)\n",
+    "base_est = DecisionTreeClassifier()\n",
+    "model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)\n",
+    "model.fit(ArrayDataset(x_train, y_train))\n",
     "\n",
-    "print('Base model accuracy: ', model.score(x_test, y_test))"
+    "print('Base model accuracy: ', model.score(ArrayDataset(x_test, y_test)))"
    ]
   },
   {
@@ -114,26 +129,26 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 17,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.929376\n",
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.936540\n",
       "Improving accuracy\n",
-      "feature to remove: 0\n",
-      "Removed feature: 0, new relative accuracy: 0.939867\n",
-      "feature to remove: 4\n",
-      "Removed feature: 4, new relative accuracy: 0.967247\n",
       "feature to remove: 2\n",
-      "Removed feature: 2, new relative accuracy: 0.972620\n",
+      "Removed feature: 2, new relative accuracy: 0.935261\n",
+      "feature to remove: 4\n",
+      "Removed feature: 4, new relative accuracy: 0.946776\n",
+      "feature to remove: 0\n",
+      "Removed feature: 0, new relative accuracy: 0.972876\n",
       "feature to remove: 1\n",
-      "Removed feature: 1, new relative accuracy: 0.992323\n",
+      "Removed feature: 1, new relative accuracy: 0.992835\n",
       "feature to remove: 3\n",
       "Removed feature: 3, new relative accuracy: 1.000000\n",
-      "Accuracy on minimized data:  0.8237371411024106\n"
+      "Accuracy on minimized data:  0.8231229847996315\n"
      ]
     }
    ],
@@ -155,10 +170,12 @@
     "X_generalizer_train, x_test, y_generalizer_train, y_test = train_test_split(x_test, y_test, stratify=y_test,\n",
     "                                                                test_size = 0.4, random_state = 38)\n",
     "x_train_predictions = model.predict(X_generalizer_train)\n",
-    "minimizer.fit(X_generalizer_train, x_train_predictions)\n",
-    "transformed = minimizer.transform(x_test)\n",
+    "if x_train_predictions.shape[1] > 1:\n",
+    "    x_train_predictions = np.argmax(x_train_predictions, axis=1)\n",
+    "minimizer.fit(dataset=ArrayDataset(X_generalizer_train, x_train_predictions))\n",
+    "transformed = minimizer.transform(dataset=ArrayDataset(x_test))\n",
     "\n",
-    "print('Accuracy on minimized data: ', model.score(transformed, y_test))"
+    "print('Accuracy on minimized data: ', model.score(ArrayDataset(transformed, y_test)))"
    ]
   },
   {
@@ -170,14 +187,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 18,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "{'ranges': {}, 'untouched': [0, 1, 2, 3, 4]}\n"
+      "{'ranges': {}, 'categories': {}, 'untouched': ['4', '1', '3', '0', '2']}\n"
      ]
     }
    ],
@@ -197,25 +214,25 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": 19,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.929376\n",
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.936540\n",
       "Improving accuracy\n",
-      "feature to remove: 0\n",
-      "Removed feature: 0, new relative accuracy: 0.939867\n",
-      "feature to remove: 4\n",
-      "Removed feature: 4, new relative accuracy: 0.967247\n",
       "feature to remove: 2\n",
-      "Removed feature: 2, new relative accuracy: 0.972620\n",
+      "Removed feature: 2, new relative accuracy: 0.935261\n",
+      "feature to remove: 4\n",
+      "Removed feature: 4, new relative accuracy: 0.946776\n",
+      "feature to remove: 0\n",
+      "Removed feature: 0, new relative accuracy: 0.972876\n",
       "feature to remove: 1\n",
-      "Removed feature: 1, new relative accuracy: 0.992323\n",
-      "Accuracy on minimized data:  0.820205742361431\n",
-      "{'ranges': {3: [546.0, 704.0, 705.5, 742.5, 782.0, 834.0, 870.0, 1446.5, 1538.5, 1612.5, 1699.0, 1744.0, 1801.0, 1814.0, 1846.0, 1881.5, 1978.5, 2248.0, 2298.5, 2537.5]}, 'untouched': [0, 1, 2, 4]}\n"
+      "Removed feature: 1, new relative accuracy: 0.992835\n",
+      "Accuracy on minimized data:  0.8192845079072624\n",
+      "{'ranges': {'3': [569.0, 782.0, 870.0, 870.5, 938.0, 1016.5, 1311.5, 1457.0, 1494.5, 1596.0, 1629.5, 1684.0, 1805.0, 1859.0, 1867.5, 1881.5, 1938.0, 1978.5, 2119.0, 2210.0, 2218.0, 2244.5, 2298.5, 2443.5]}, 'categories': {}, 'untouched': ['2', '1', '0', '4']}\n"
      ]
     }
    ],
@@ -223,9 +240,9 @@
     "# We allow a 1% deviation in accuracy from the original model accuracy\n",
     "minimizer2 = GeneralizeToRepresentative(model, target_accuracy=0.99)\n",
     "\n",
-    "minimizer2.fit(X_generalizer_train, x_train_predictions)\n",
-    "transformed2 = minimizer2.transform(x_test)\n",
-    "print('Accuracy on minimized data: ', model.score(transformed2, y_test))\n",
+    "minimizer2.fit(dataset=ArrayDataset(X_generalizer_train, x_train_predictions))\n",
+    "transformed2 = minimizer2.transform(dataset=ArrayDataset(x_test))\n",
+    "print('Accuracy on minimized data: ', model.score(test_data=ArrayDataset(transformed2, y_test)))\n",
     "generalizations2 = minimizer2.generalizations\n",
     "print(generalizations2)"
    ]
@@ -259,4 +276,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 2
-}
+}
\ No newline at end of file
diff --git a/requirements.txt b/requirements.txt
index fa4131d..ec37771 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -2,6 +2,7 @@ numpy==1.21.0
 pandas==1.1.0
 scipy==1.4.1
 scikit-learn==0.22.2
+adversarial-robustness-toolbox>=1.9.1
 
 # testing
 pytest==5.4.2
diff --git a/tests/test_anonymizer.py b/tests/test_anonymizer.py
index 000eefa..358398c 100644
--- a/tests/test_anonymizer.py
+++ b/tests/test_anonymizer.py
@@ -7,13 +7,15 @@ from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from sklearn.preprocessing import OneHotEncoder
 
 from apt.anonymization import Anonymize
-from apt.utils import get_iris_dataset, get_adult_dataset, get_nursery_dataset
+from apt.utils.dataset_utils import get_iris_dataset, get_adult_dataset, get_nursery_dataset
 from sklearn.datasets import load_diabetes
 from sklearn.model_selection import train_test_split
+from apt.utils.datasets import ArrayDataset, DATA_PANDAS_NUMPY_TYPE
 
 
 def test_anonymize_ndarray_iris():
     (x_train, y_train), _ = get_iris_dataset()
+
     model = DecisionTreeClassifier()
     model.fit(x_train, y_train)
     pred = model.predict(x_train)
@@ -21,7 +23,7 @@ def test_anonymize_ndarray_iris():
     k = 10
     QI = [0, 2]
     anonymizer = Anonymize(k, QI, train_only_QI=True)
-    anon = anonymizer.anonymize(x_train, pred)
+    anon = anonymizer.anonymize(ArrayDataset(x_train, pred))
     assert(len(np.unique(anon[:, QI], axis=0)) < len(np.unique(x_train[:, QI], axis=0)))
     _, counts_elements = np.unique(anon[:, QI], return_counts=True)
     assert (np.min(counts_elements) >= k)
@@ -30,10 +32,14 @@ def test_anonymize_ndarray_iris():
 
 def test_anonymize_pandas_adult():
     (x_train, y_train), _ = get_adult_dataset()
+    encoded = OneHotEncoder().fit_transform(x_train)
+    model = DecisionTreeClassifier()
+    model.fit(encoded, y_train)
+    pred = model.predict(encoded)
 
     k = 100
-    features = ['age', 'workclass', 'education-num', 'marital-status', 'occupation',
-                'relationship', 'race', 'sex', 'capital-gain', 'capital-loss', 'hours-per-week', 'native-country']
+    features = ['age', 'workclass', 'education-num', 'marital-status', 'occupation', 'relationship', 'race', 'sex',
+                'capital-gain', 'capital-loss', 'hours-per-week', 'native-country']
     QI = ['age', 'workclass', 'education-num', 'marital-status', 'occupation', 'relationship', 'race', 'sex',
           'native-country']
     categorical_features = ['workclass', 'marital-status', 'occupation', 'relationship', 'race', 'sex',
@@ -56,12 +62,11 @@ def test_anonymize_pandas_adult():
     pred = model.predict(encoded)
 
     anonymizer = Anonymize(k, QI, categorical_features=categorical_features)
-    anon = anonymizer.anonymize(x_train, pred)
+    anon = anonymizer.anonymize(ArrayDataset(x_train, pred, features))
 
     assert(anon.loc[:, QI].drop_duplicates().shape[0] < x_train.loc[:, QI].drop_duplicates().shape[0])
     assert (anon.loc[:, QI].value_counts().min() >= k)
-    assert (anon.drop(QI, axis=1).equals(x_train.drop(QI, axis=1)))
-
+    np.testing.assert_array_equal(anon.drop(QI, axis=1), x_train.drop(QI, axis=1))
 
 def test_anonymize_pandas_nursery():
     (x_train, y_train), _ = get_nursery_dataset()
@@ -89,11 +94,11 @@ def test_anonymize_pandas_nursery():
     pred = model.predict(encoded)
 
     anonymizer = Anonymize(k, QI, categorical_features=categorical_features, train_only_QI=True)
-    anon = anonymizer.anonymize(x_train, pred)
+    anon = anonymizer.anonymize(ArrayDataset(x_train, pred))
 
     assert(anon.loc[:, QI].drop_duplicates().shape[0] < x_train.loc[:, QI].drop_duplicates().shape[0])
     assert (anon.loc[:, QI].value_counts().min() >= k)
-    assert (anon.drop(QI, axis=1).equals(x_train.drop(QI, axis=1)))
+    np.testing.assert_array_equal(anon.drop(QI, axis=1), x_train.drop(QI, axis=1))
 
 
 def test_regression():
@@ -107,7 +112,7 @@ def test_regression():
     k = 10
     QI = [0, 2, 5, 8]
     anonymizer = Anonymize(k, QI, is_regression=True, train_only_QI=True)
-    anon = anonymizer.anonymize(x_train, pred)
+    anon = anonymizer.anonymize(ArrayDataset(x_train, pred))
     print('Base model accuracy (R2 score): ', model.score(x_test, y_test))
     model.fit(anon, y_train)
     print('Base model accuracy (R2 score) after anonymization: ', model.score(x_test, y_test))
@@ -127,7 +132,7 @@ def test_errors():
     anonymizer = Anonymize(10, [0, 2])
     (x_train, y_train), (x_test, y_test) = get_iris_dataset()
     with pytest.raises(ValueError):
-        anonymizer.anonymize(x_train, y_test)
+        anonymizer.anonymize(dataset=ArrayDataset(x_train, y_test))
     (x_train, y_train), _ = get_adult_dataset()
     with pytest.raises(ValueError):
-        anonymizer.anonymize(x_train, y_train)
+        anonymizer.anonymize(dataset=ArrayDataset(x_train, y_test))
diff --git a/tests/test_minimizer.py b/tests/test_minimizer.py
index e6f50be..630cd49 100644
--- a/tests/test_minimizer.py
+++ b/tests/test_minimizer.py
@@ -5,14 +5,15 @@ from sklearn.compose import ColumnTransformer
 
 from sklearn.datasets import load_boston, load_diabetes
 from sklearn.impute import SimpleImputer
-from sklearn.linear_model import LogisticRegression
 from sklearn.model_selection import train_test_split
 from sklearn.pipeline import Pipeline
-from sklearn.preprocessing import OneHotEncoder, StandardScaler
+from sklearn.preprocessing import OneHotEncoder
 
 from apt.minimization import GeneralizeToRepresentative
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
-from apt.utils import get_iris_dataset, get_adult_dataset, get_nursery_dataset, get_german_credit_dataset
+from apt.utils.dataset_utils import get_iris_dataset, get_adult_dataset, get_nursery_dataset, get_german_credit_dataset
+from apt.utils.datasets import ArrayDataset
+from apt.utils.models import SklearnClassifier, ModelOutputType, SklearnRegressor
 
 
 @pytest.fixture
@@ -38,11 +39,12 @@ def test_minimizer_params(data):
     y = [1, 1, 0]
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    base_est.fit(X, y)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(X, y))
 
-    gen = GeneralizeToRepresentative(base_est, features=features, cells=cells)
+    gen = GeneralizeToRepresentative(model, cells=cells)
     gen.fit()
-    transformed = gen.transform(X)
+    transformed = gen.transform(dataset=ArrayDataset(X, features_names=features))
 
 
 def test_minimizer_fit(data):
@@ -58,15 +60,20 @@ def test_minimizer_fit(data):
                   [69, 175],
                   [24, 181],
                   [18, 190]])
-    y = [1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]
+    y = np.array([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    base_est.fit(X, y)
-    predictions = base_est.predict(X)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(X, y))
+    predictions = model.predict(X)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
 
-    gen = GeneralizeToRepresentative(base_est, features=features, target_accuracy=0.5)
-    gen.fit(X, predictions)
-    transformed = gen.transform(X)
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5)
+    train_dataset = ArrayDataset(X, predictions, features_names=features)
+
+    gen.fit(dataset=train_dataset)
+    transformed = gen.transform(dataset=ArrayDataset(X))
     gener = gen.generalizations_
     expexted_generalizations = {'ranges': {}, 'categories': {}, 'untouched': ['height', 'age']}
 
@@ -103,7 +110,7 @@ def test_minimizer_fit_pandas(data):
          [69, 175, 'm', 'aa'],
          [24, 181, 'm', 'bb'],
          [18, 190, 'm', 'bb']]
-    y = [1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]
+    y = np.array([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
     X = pd.DataFrame(X, columns=features)
 
     numeric_features = ["age", "height"]
@@ -121,16 +128,22 @@ def test_minimizer_fit_pandas(data):
         ]
     )
     encoded = preprocessor.fit_transform(X)
+    encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    base_est.fit(encoded, y)
-    predictions = base_est.predict(encoded)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(encoded, y))
+    predictions = model.predict(encoded)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
+
     # Append classifier to preprocessing pipeline.
     # Now we have a full prediction pipeline.
-    gen = GeneralizeToRepresentative(base_est, features=features, target_accuracy=0.5,
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5,
                                      categorical_features=categorical_features)
-    gen.fit(X, predictions)
-    transformed = gen.transform(X)
+    train_dataset = ArrayDataset(X, predictions)
+    gen.fit(dataset=train_dataset)
+    transformed = gen.transform(dataset=ArrayDataset(X))
     gener = gen.generalizations_
     expexted_generalizations = {'ranges': {'age': []}, 'categories': {}, 'untouched': ['ola', 'height', 'sex']}
 
@@ -143,7 +156,7 @@ def test_minimizer_fit_pandas(data):
     modified_features = [f for f in features if
                          f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
                              'ranges'].keys()]
-    assert (transformed.drop(modified_features, axis=1).equals(X.drop(modified_features, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), X.drop(modified_features, axis=1))
     ncp = gen.ncp_
     if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
@@ -179,7 +192,7 @@ def test_minimizer_params_categorical(data):
          [24, 181, 'm'],
          [18, 190, 'm']]
 
-    y = [1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]
+    y = np.array([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
     X = pd.DataFrame(X, columns=features)
     numeric_features = ["age", "height"]
     numeric_transformer = Pipeline(
@@ -196,16 +209,21 @@ def test_minimizer_params_categorical(data):
         ]
     )
     encoded = preprocessor.fit_transform(X)
+    encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    base_est.fit(encoded, y)
-    predictions = base_est.predict(encoded)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(encoded, y))
+    predictions = model.predict(encoded)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
     # Append classifier to preprocessing pipeline.
     # Now we have a full prediction pipeline.
-    gen = GeneralizeToRepresentative(base_est, features=features, target_accuracy=0.5,
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5,
                                      categorical_features=categorical_features, cells=cells)
-    gen.fit(X, predictions)
-    transformed = gen.transform(X)
+    train_dataset = ArrayDataset(X, predictions)
+    gen.fit(dataset=train_dataset)
+    transformed = gen.transform(dataset=ArrayDataset(X))
 
 
 def test_minimizer_fit_QI(data):
@@ -222,16 +240,20 @@ def test_minimizer_fit_QI(data):
                   [24, 181, 95],
                   [18, 190, 102]])
     print(X)
-    y = [1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]
-    QI = [0, 2]
+    y = np.array([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
+    QI = ['age', 'weight']
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    base_est.fit(X, y)
-    predictions = base_est.predict(X)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(X, y))
+    predictions = model.predict(X)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
 
-    gen = GeneralizeToRepresentative(base_est, features=features, target_accuracy=0.5, features_to_minimize=QI)
-    gen.fit(X, predictions)
-    transformed = gen.transform(X)
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
+    train_dataset = ArrayDataset(X, predictions, features_names=features)
+    gen.fit(dataset=train_dataset)
+    transformed = gen.transform(dataset=ArrayDataset(X))
     gener = gen.generalizations_
     expexted_generalizations = {'ranges': {'age': [], 'weight': [67.5]}, 'categories': {}, 'untouched': ['height']}
     for key in expexted_generalizations['ranges']:
@@ -240,7 +262,7 @@ def test_minimizer_fit_QI(data):
         assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
     assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
-    assert ((np.delete(transformed, QI, axis=1) == np.delete(X, QI, axis=1)).all())
+    assert ((np.delete(transformed, [0, 2], axis=1) == np.delete(X, [0, 2], axis=1)).all())
     modified_features = [f for f in features if
                          f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
                              'ranges'].keys()]
@@ -269,7 +291,7 @@ def test_minimizer_fit_pandas_QI(data):
          [24, 181, 49, 'm', 'bb'],
          [18, 190, 69, 'm', 'bb']]
 
-    y = [1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0]
+    y = pd.Series([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
     X = pd.DataFrame(X, columns=features)
     QI = ['age', 'weight', 'ola']
 
@@ -288,16 +310,22 @@ def test_minimizer_fit_pandas_QI(data):
         ]
     )
     encoded = preprocessor.fit_transform(X)
+    encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    base_est.fit(encoded, y)
-    predictions = base_est.predict(encoded)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(encoded, y))
+    predictions = model.predict(encoded)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
+
     # Append classifier to preprocessing pipeline.
     # Now we have a full prediction pipeline.
-    gen = GeneralizeToRepresentative(base_est, features=features, target_accuracy=0.5,
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5,
                                      categorical_features=categorical_features, features_to_minimize=QI)
-    gen.fit(X, predictions)
-    transformed = gen.transform(X)
+    train_dataset = ArrayDataset(X, predictions)
+    gen.fit(dataset=train_dataset)
+    transformed = gen.transform(dataset=ArrayDataset(X))
     gener = gen.generalizations_
     expexted_generalizations = {'ranges': {'age': [], 'weight': [47.0]}, 'categories': {'ola': [['bb', 'aa']]},
                                 'untouched': ['height', 'sex']}
@@ -308,12 +336,13 @@ def test_minimizer_fit_pandas_QI(data):
         assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
     assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
-    assert (transformed.drop(QI, axis=1).equals(X.drop(QI, axis=1)))
-
+    # assert (transformed.drop(QI, axis=1).equals(X.drop(QI, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(QI, axis=1), X.drop(QI, axis=1))
     modified_features = [f for f in features if
                          f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
                              'ranges'].keys()]
-    assert (transformed.drop(modified_features, axis=1).equals(X.drop(modified_features, axis=1)))
+    # assert (transformed.drop(modified_features, axis=1).equals(X.drop(modified_features, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), X.drop(modified_features, axis=1))
     ncp = gen.ncp_
     if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
@@ -322,16 +351,19 @@ def test_minimizer_fit_pandas_QI(data):
 
 def test_minimize_ndarray_iris():
     features = ['sepal length (cm)', 'sepal width (cm)', 'petal length (cm)', 'petal width (cm)']
-    (x_train, y_train), _ = get_iris_dataset()
-    QI = [0, 2]
-    model = DecisionTreeClassifier(random_state=0, min_samples_split=2,
-                                   min_samples_leaf=1)
-    model.fit(x_train, y_train)
-    pred = model.predict(x_train)
+    (x_train, y_train), (x_test, y_test) = get_iris_dataset()
+    QI = ['sepal length (cm)', 'petal length (cm)']
+    base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
+                                      min_samples_leaf=1)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(x_train, y_train))
+    predictions = model.predict(x_train)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
 
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.3, features=features, features_to_minimize=QI)
-    gen.fit(x_train, pred)
-    transformed = gen.transform(x_train)
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.3, features_to_minimize=QI)
+    # gen.fit(dataset=ArrayDataset(x_train, predictions))
+    transformed = gen.fit_transform(dataset=ArrayDataset(x_train, predictions, features_names=features))
     gener = gen.generalizations_
     expexted_generalizations = {'ranges': {'sepal length (cm)': [], 'petal length (cm)': [2.449999988079071]},
                                 'categories': {}, 'untouched': ['petal width (cm)', 'sepal width (cm)']}
@@ -342,7 +374,7 @@ def test_minimize_ndarray_iris():
         assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
     assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
-    assert ((np.delete(transformed, QI, axis=1) == np.delete(x_train, QI, axis=1)).all())
+    assert ((np.delete(transformed, [0, 2], axis=1) == np.delete(x_train, [0, 2], axis=1)).all())
 
     modified_features = [f for f in features if
                          f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
@@ -359,12 +391,13 @@ def test_minimize_ndarray_iris():
 
 
 def test_minimize_pandas_adult():
-    (x_train, y_train), _ = get_adult_dataset()
+    (x_train, y_train), (x_test, y_test) = get_adult_dataset()
     x_train = x_train.head(1000)
     y_train = y_train.head(1000)
 
     features = ['age', 'workclass', 'education-num', 'marital-status', 'occupation', 'relationship', 'race', 'sex',
                 'capital-gain', 'capital-loss', 'hours-per-week', 'native-country']
+    x_train = pd.DataFrame(x_train, columns=features)
 
     categorical_features = ['workclass', 'marital-status', 'occupation', 'relationship', 'race', 'sex',
                             'hours-per-week', 'native-country']
@@ -384,15 +417,19 @@ def test_minimize_pandas_adult():
         ]
     )
     encoded = preprocessor.fit_transform(x_train)
+    encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    base_est.fit(encoded, y_train)
-    predictions = base_est.predict(encoded)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(encoded, y_train))
+    predictions = model.predict(encoded)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
 
-    gen = GeneralizeToRepresentative(base_est, target_accuracy=0.7, features=features,
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.7,
                                      categorical_features=categorical_features, features_to_minimize=QI)
-    gen.fit(x_train, predictions)
-    transformed = gen.transform(x_train)
+    gen.fit(dataset=ArrayDataset(x_train, predictions, features_names=features))
+    transformed = gen.transform(dataset=ArrayDataset(x_train))
     gener = gen.generalizations_
     expexted_generalizations = {'ranges': {'age': [], 'education-num': []}, 'categories': {
         'workclass': [['Self-emp-not-inc', 'Private', 'Federal-gov', 'Self-emp-inc', '?', 'Local-gov', 'State-gov']],
@@ -414,12 +451,14 @@ def test_minimize_pandas_adult():
         assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
     assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
-    assert (transformed.drop(QI, axis=1).equals(x_train.drop(QI, axis=1)))
+    # assert (transformed.drop(QI, axis=1).equals(x_train.drop(QI, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(QI, axis=1), x_train.drop(QI, axis=1))
 
     modified_features = [f for f in features if
                          f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
                              'ranges'].keys()]
-    assert (transformed.drop(modified_features, axis=1).equals(x_train.drop(modified_features, axis=1)))
+    # assert (transformed.drop(modified_features, axis=1).equals(x_train.drop(modified_features, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), x_train.drop(modified_features, axis=1))
     ncp = gen.ncp_
     if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
@@ -451,15 +490,19 @@ def test_german_credit_pandas():
         ]
     )
     encoded = preprocessor.fit_transform(x_train)
+    encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    base_est.fit(encoded, y_train)
-    predictions = base_est.predict(encoded)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(encoded, y_train))
+    predictions = model.predict(encoded)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
 
-    gen = GeneralizeToRepresentative(base_est, target_accuracy=0.7, features=features,
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.7,
                                      categorical_features=categorical_features, features_to_minimize=QI)
-    gen.fit(x_train, predictions)
-    transformed = gen.transform(x_train)
+    gen.fit(dataset=ArrayDataset(x_train, predictions))
+    transformed = gen.transform(dataset=ArrayDataset(x_train))
     gener = gen.generalizations_
     expexted_generalizations = {'ranges': {'Duration_in_month': [31.5]},
                                 'categories': {'Credit_history': [['A30', 'A32', 'A31', 'A34', 'A33']], 'Purpose': [
@@ -481,12 +524,14 @@ def test_german_credit_pandas():
         assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
     assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
-    assert (transformed.drop(QI, axis=1).equals(x_train.drop(QI, axis=1)))
+    # assert (transformed.drop(QI, axis=1).equals(x_train.drop(QI, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(QI, axis=1), x_train.drop(QI, axis=1))
 
     modified_features = [f for f in features if
                          f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
                              'ranges'].keys()]
-    assert (transformed.drop(modified_features, axis=1).equals(x_train.drop(modified_features, axis=1)))
+    # assert (transformed.drop(modified_features, axis=1).equals(x_train.drop(modified_features, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), x_train.drop(modified_features, axis=1))
     ncp = gen.ncp_
     if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
@@ -497,17 +542,258 @@ def test_regression():
     dataset = load_diabetes()
     x_train, x_test, y_train, y_test = train_test_split(dataset.data, dataset.target, test_size=0.5, random_state=14)
 
-    model = DecisionTreeRegressor(random_state=10, min_samples_split=2)
-    model.fit(x_train, y_train)
-    pred = model.predict(x_train)
-    QI = [0, 2, 5, 8]
+    base_est = DecisionTreeRegressor(random_state=10, min_samples_split=2)
+    model = SklearnRegressor(base_est)
+    model.fit(ArrayDataset(x_train, y_train))
+    predictions = model.predict(x_train)
+    QI = ['age', 'bmi', 's2', 's5']
     features = ['age', 'sex', 'bmi', 'bp',
                 's1', 's2', 's3', 's4', 's5', 's6']
 
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.7, features=features, is_regression=True,
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.7, is_regression=True,
                                      features_to_minimize=QI)
-    gen.fit(x_train, pred)
-    transformed = gen.transform(x_train)
+    gen.fit(dataset=ArrayDataset(x_train, predictions, features_names=features))
+    transformed = gen.transform(dataset=ArrayDataset(x_train, features_names=features))
+    print('Base model accuracy (R2 score): ', model.score(ArrayDataset(x_test, y_test)))
+    model.fit(ArrayDataset(transformed, y_train))
+    print('Base model accuracy (R2 score) after anonymization: ', model.score(ArrayDataset(x_test, y_test)))
+    gener = gen.generalizations_
+    expexted_generalizations = {'ranges': {
+        'age': [-0.07816532626748085, -0.07090024650096893, -0.05637009255588055, -0.05092128552496433,
+                -0.04728874587453902, -0.04547247663140297, -0.04183994047343731, -0.027309784665703773,
+                -0.023677248042076826, -0.020044708624482155, -0.01641217083670199, -0.001882016600575298,
+                0.0017505218856967986, 0.0035667913616634905, 0.007199329789727926, 0.010831868276000023,
+                0.02354575227946043, 0.030810829252004623, 0.03262709779664874, 0.03444336913526058,
+                0.03625963814556599, 0.03807590529322624, 0.03807590715587139, 0.047157252207398415,
+                0.06168740428984165, 0.0635036751627922, 0.06895248219370842, 0.07258502021431923, 0.07621755823493004,
+                0.1034616008400917],
+        'bmi': [-0.07626373693346977, -0.060635464265942574, -0.056863121688365936, -0.05578530766069889,
+                -0.054168591275811195, -0.042312657460570335, -0.0374625027179718, -0.03422906715422869,
+                -0.033690162003040314, -0.03261234890669584, -0.02614547684788704, -0.025067666545510292,
+                -0.022373135201632977, -0.016984074376523495, -0.01375063881278038, -0.007822672137990594,
+                -0.004589236050378531, 0.008344509289599955, 0.015889193629845977, 0.016967005096375942,
+                0.024511689320206642, 0.0272062208969146, 0.030978563241660595, 0.032595280557870865,
+                0.033673093654215336, 0.04391230642795563, 0.04552902653813362, 0.05469042807817459,
+                0.06977979838848114, 0.07301323488354683, 0.09349166229367256],
+        's2': [-0.1044962927699089, -0.08649025857448578, -0.07740895450115204, -0.07114598527550697,
+               -0.06378699466586113, -0.05971606448292732, -0.04437179118394852, -0.0398311372846365,
+               -0.03137612994760275, -0.022138250060379505, -0.018067320343106985, -0.017910746857523918,
+               -0.017910745926201344, -0.01618842873722315, -0.007576846517622471, -0.007263698382303119,
+               -0.0010007291566580534, 0.0010347360512241721, 0.006514834007248282, 0.00933317095041275,
+               0.012464655097573996, 0.019197346206055954, 0.020919663831591606, 0.02217225730419159,
+               0.032036433927714825, 0.036420512944459915, 0.04080459102988243, 0.04127431474626064,
+               0.04268348217010498, 0.04424922354519367, 0.04424922540783882, 0.056462014093995094, 0.05928034894168377,
+               0.061315815430134535, 0.06272498145699501, 0.06460387445986271]}, 'categories': {},
+        'untouched': ['s5', 's3', 'bp', 's1', 'sex', 's6', 's4']}
+
+    for key in expexted_generalizations['ranges']:
+        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expexted_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+                set([frozenset(sl) for sl in gener['categories'][key]]))
+    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert ((np.delete(transformed, [0, 2, 5, 8], axis=1) == np.delete(x_train, [0, 2, 5, 8], axis=1)).all())
+
+    modified_features = [f for f in features if
+                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                             'ranges'].keys()]
+    indexes = []
+    for i in range(len(features)):
+        if features[i] in modified_features:
+            indexes.append(i)
+    assert ((np.delete(transformed, indexes, axis=1) == np.delete(x_train, indexes, axis=1)).all())
+    ncp = gen.ncp_
+    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+        assert (ncp > 0)
+        assert (((transformed[indexes]) != (x_train[indexes])).any())
+
+
+def test_X_y(data):
+    """Minimize from raw ``X``/``y`` arrays without names; generalizations are keyed by stringified column index."""
+    features = [0, 1, 2]
+    X = np.array([[23, 165, 70],
+                  [45, 158, 67],
+                  [56, 123, 65],
+                  [67, 154, 90],
+                  [45, 149, 67],
+                  [42, 166, 58],
+                  [73, 172, 68],
+                  [94, 168, 69],
+                  [69, 175, 80],
+                  [24, 181, 95],
+                  [18, 190, 102]])
+    print(X)
+    y = np.array([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
+    QI = [0, 2]
+    base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
+                                      min_samples_leaf=1)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(X, y))
+    predictions = model.predict(X)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
+
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
+    gen.fit(X=X, y=predictions)
+    transformed = gen.transform(X)
+    gener = gen.generalizations_
+    expexted_generalizations = {'ranges': {'0': [], '2': [67.5]}, 'categories': {}, 'untouched': ['1']}
+    for key in expexted_generalizations['ranges']:
+        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expexted_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+                set([frozenset(sl) for sl in gener['categories'][key]]))
+    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert ((np.delete(transformed, [0, 2], axis=1) == np.delete(X, [0, 2], axis=1)).all())
+    modified_features = [f for f in features if
+                         str(f) in expexted_generalizations['categories'].keys() or str(f) in expexted_generalizations[
+                             'ranges'].keys()]
+    # Column positions of the features that are expected to be generalized.
+    indexes = [i for i, f in enumerate(features) if f in modified_features]
+    assert ((np.delete(transformed, indexes, axis=1) == np.delete(X, indexes, axis=1)).all())
+    ncp = gen.ncp_
+    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+        assert (ncp > 0)
+        # Compare the generalized columns; plain ``transformed[indexes]`` would select rows instead.
+        assert ((transformed[:, indexes] != X[:, indexes]).any())
+
+
+def test_X_y_features_names(data):
+    """Minimize from raw ``X``/``y`` arrays plus ``features_names``; generalizations are keyed by those names."""
+    features = ['age', 'height', 'weight']
+    X = np.array([[23, 165, 70],
+                  [45, 158, 67],
+                  [56, 123, 65],
+                  [67, 154, 90],
+                  [45, 149, 67],
+                  [42, 166, 58],
+                  [73, 172, 68],
+                  [94, 168, 69],
+                  [69, 175, 80],
+                  [24, 181, 95],
+                  [18, 190, 102]])
+    print(X)
+    y = np.array([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
+    QI = ['age', 'weight']
+    base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
+                                      min_samples_leaf=1)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model.fit(ArrayDataset(X, y))
+    predictions = model.predict(X)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
+
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
+    gen.fit(X=X, y=predictions, features_names=features)
+    transformed = gen.transform(X=X, features_names=features)
+    gener = gen.generalizations_
+    expexted_generalizations = {'ranges': {'age': [], 'weight': [67.5]}, 'categories': {}, 'untouched': ['height']}
+    for key in expexted_generalizations['ranges']:
+        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expexted_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+                set([frozenset(sl) for sl in gener['categories'][key]]))
+    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert ((np.delete(transformed, [0, 2], axis=1) == np.delete(X, [0, 2], axis=1)).all())
+    modified_features = [f for f in features if
+                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                             'ranges'].keys()]
+    # Column positions of the features that are expected to be generalized.
+    indexes = [i for i, f in enumerate(features) if f in modified_features]
+    assert ((np.delete(transformed, indexes, axis=1) == np.delete(X, indexes, axis=1)).all())
+    ncp = gen.ncp_
+    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+        assert (ncp > 0)
+        # Compare the generalized columns; plain ``transformed[indexes]`` would select rows instead.
+        assert ((transformed[:, indexes] != X[:, indexes]).any())
+
+
+def test_BaseEstimator_classification(data):
+    features = ['age', 'height', 'weight', 'sex', 'ola']
+    X = [[23, 165, 65, 'f', 'aa'],
+         [45, 158, 76, 'f', 'aa'],
+         [56, 123, 78, 'f', 'bb'],
+         [67, 154, 87, 'm', 'aa'],
+         [45, 149, 45, 'f', 'bb'],
+         [42, 166, 76, 'm', 'bb'],
+         [73, 172, 85, 'm', 'bb'],
+         [94, 168, 92, 'f', 'aa'],
+         [69, 175, 95, 'm', 'aa'],
+         [24, 181, 49, 'm', 'bb'],
+         [18, 190, 69, 'm', 'bb']]
+
+    y = pd.Series([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
+    X = pd.DataFrame(X, columns=features)
+    QI = ['age', 'weight', 'ola']
+
+    numeric_features = ["age", "height", "weight"]
+    numeric_transformer = Pipeline(
+        steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
+    )
+
+    categorical_features = ["sex", "ola"]
+    categorical_transformer = OneHotEncoder(handle_unknown="ignore")
+
+    preprocessor = ColumnTransformer(
+        transformers=[
+            ("num", numeric_transformer, numeric_features),
+            ("cat", categorical_transformer, categorical_features),
+        ]
+    )
+    encoded = preprocessor.fit_transform(X)
+    encoded = pd.DataFrame(encoded)
+    base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
+                                      min_samples_leaf=1)
+    model = base_est
+    model.fit(encoded, y)
+    predictions = model.predict(encoded)
+
+    # Append classifier to preprocessing pipeline.
+    # Now we have a full prediction pipeline.
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5,
+                                     categorical_features=categorical_features, features_to_minimize=QI)
+    train_dataset = ArrayDataset(X, predictions)
+    gen.fit(dataset=train_dataset)
+    transformed = gen.transform(dataset=ArrayDataset(X))
+    gener = gen.generalizations_
+    expexted_generalizations = {'ranges': {'age': [], 'weight': [47.0]}, 'categories': {'ola': [['bb', 'aa']]},
+                                'untouched': ['height', 'sex']}
+
+    for key in expexted_generalizations['ranges']:
+        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expexted_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+                set([frozenset(sl) for sl in gener['categories'][key]]))
+    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    # assert (transformed.drop(QI, axis=1).equals(X.drop(QI, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(QI, axis=1), X.drop(QI, axis=1))
+    modified_features = [f for f in features if
+                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                             'ranges'].keys()]
+    # assert (transformed.drop(modified_features, axis=1).equals(X.drop(modified_features, axis=1)))
+    np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), X.drop(modified_features, axis=1))
+    ncp = gen.ncp_
+    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+        assert (ncp > 0)
+        assert (((transformed[modified_features]).equals(X[modified_features])) == False)
+
+
+def test_BaseEstimator_regression():
+    dataset = load_diabetes()
+    x_train, x_test, y_train, y_test = train_test_split(dataset.data, dataset.target, test_size=0.5, random_state=14)
+
+    base_est = DecisionTreeRegressor(random_state=10, min_samples_split=2)
+    model = base_est
+    model.fit(x_train, y_train)
+    predictions = model.predict(x_train)
+    QI = ['age', 'bmi', 's2', 's5']
+    features = ['age', 'sex', 'bmi', 'bp',
+                's1', 's2', 's3', 's4', 's5', 's6']
+
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.7, is_regression=True,
+                                     features_to_minimize=QI)
+    gen.fit(dataset=ArrayDataset(x_train, predictions, features_names=features))
+    transformed = gen.transform(dataset=ArrayDataset(x_train, features_names=features))
     print('Base model accuracy (R2 score): ', model.score(x_test, y_test))
     model.fit(transformed, y_train)
     print('Base model accuracy (R2 score) after minimization: ', model.score(x_test, y_test))
@@ -546,7 +832,7 @@ def test_regression():
         assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
     assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
-    assert ((np.delete(transformed, QI, axis=1) == np.delete(x_train, QI, axis=1)).all())
+    assert ((np.delete(transformed, [0, 2, 5, 8], axis=1) == np.delete(x_train, [0, 2, 5, 8], axis=1)).all())
 
     modified_features = [f for f in features if
                          f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
diff --git a/tests/test_model.py b/tests/test_model.py
new file mode 100644
index 0000000..bbb951b
--- /dev/null
+++ b/tests/test_model.py
@@ -0,0 +1,35 @@
+import pytest
+
+from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType
+from apt.utils.datasets import ArrayDataset
+from apt.utils import dataset_utils
+
+from sklearn.tree import DecisionTreeRegressor
+from sklearn.ensemble import RandomForestClassifier
+
+
+def test_sklearn_classifier():
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset()
+    underlying_model = RandomForestClassifier()
+    model = SklearnClassifier(underlying_model, ModelOutputType.CLASSIFIER_VECTOR)
+    train = ArrayDataset(x_train, y_train)
+    test = ArrayDataset(x_test, y_test)
+    model.fit(train)
+    pred = model.predict(x_test)
+    assert(pred.shape[0] == x_test.shape[0])
+
+    score = model.score(test)
+    assert(0.0 <= score <= 1.0)
+
+
+def test_sklearn_regressor():
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_diabetes_dataset()
+    underlying_model = DecisionTreeRegressor()
+    model = SklearnRegressor(underlying_model)
+    train = ArrayDataset(x_train, y_train)
+    test = ArrayDataset(x_test, y_test)
+    model.fit(train)
+    pred = model.predict(x_test)
+    assert (pred.shape[0] == x_test.shape[0])
+
+    score = model.score(test)

From adc6b44350be23ab23863ba4c669564175af6cb6 Mon Sep 17 00:00:00 2001
From: abigailgold <57357634+abigailgold@users.noreply.github.com>
Date: Sun, 1 May 2022 15:18:07 +0300
Subject: [PATCH 06/26] Bump version and update documentation (#27)

* Bump version to 0.1.0 (breaking changes to some APIs)
* Update documentation
---
 apt/__init__.py                   |  2 +-
 docs/conf.py                      |  2 +-
 docs/source/apt.anonymization.rst | 12 ++++++------
 docs/source/apt.minimization.rst  | 12 ++++++------
 docs/source/apt.rst               | 24 +++++++-----------------
 docs/source/modules.rst           |  5 ++---
 setup.cfg                         |  2 +-
 7 files changed, 24 insertions(+), 35 deletions(-)

diff --git a/apt/__init__.py b/apt/__init__.py
index ea6178a..135bd33 100644
--- a/apt/__init__.py
+++ b/apt/__init__.py
@@ -6,4 +6,4 @@ from apt import anonymization
 from apt import minimization
 from apt import utils
 
-__version__ = "0.0.4"
\ No newline at end of file
+__version__ = "0.1.0"
\ No newline at end of file
diff --git a/docs/conf.py b/docs/conf.py
index 36cdd76..6452871 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -22,7 +22,7 @@ copyright = '2021, IBM'
 author = 'Abigail Goldsteen'
 
 # The full version, including alpha/beta/rc tags
-release = '0.0.4'
+release = '0.1.0'
 
 master_doc = 'index'
 
diff --git a/docs/source/apt.anonymization.rst b/docs/source/apt.anonymization.rst
index 727706b..6453554 100644
--- a/docs/source/apt.anonymization.rst
+++ b/docs/source/apt.anonymization.rst
@@ -8,15 +8,15 @@ apt.anonymization.anonymizer module
 -----------------------------------
 
 .. automodule:: apt.anonymization.anonymizer
-    :members:
-    :undoc-members:
-    :show-inheritance:
+   :members:
+   :undoc-members:
+   :show-inheritance:
 
 
 Module contents
 ---------------
 
 .. automodule:: apt.anonymization
-    :members:
-    :undoc-members:
-    :show-inheritance:
+   :members:
+   :undoc-members:
+   :show-inheritance:
diff --git a/docs/source/apt.minimization.rst b/docs/source/apt.minimization.rst
index 0be47c8..417fc68 100644
--- a/docs/source/apt.minimization.rst
+++ b/docs/source/apt.minimization.rst
@@ -8,15 +8,15 @@ apt.minimization.minimizer module
 ---------------------------------
 
 .. automodule:: apt.minimization.minimizer
-    :members:
-    :undoc-members:
-    :show-inheritance:
+   :members:
+   :undoc-members:
+   :show-inheritance:
 
 
 Module contents
 ---------------
 
 .. automodule:: apt.minimization
-    :members:
-    :undoc-members:
-    :show-inheritance:
+   :members:
+   :undoc-members:
+   :show-inheritance:
diff --git a/docs/source/apt.rst b/docs/source/apt.rst
index fbe1c02..ebbf65f 100644
--- a/docs/source/apt.rst
+++ b/docs/source/apt.rst
@@ -5,26 +5,16 @@ Subpackages
 -----------
 
 .. toctree::
+   :maxdepth: 4
 
-    apt.anonymization
-    apt.minimization
-
-Submodules
-----------
-
-apt.utils module
-----------------
-
-.. automodule:: apt.utils
-    :members:
-    :undoc-members:
-    :show-inheritance:
-
+   apt.anonymization
+   apt.minimization
+   apt.utils
 
 Module contents
 ---------------
 
 .. automodule:: apt
-    :members:
-    :undoc-members:
-    :show-inheritance:
+   :members:
+   :undoc-members:
+   :show-inheritance:
diff --git a/docs/source/modules.rst b/docs/source/modules.rst
index 9b7541d..c187881 100644
--- a/docs/source/modules.rst
+++ b/docs/source/modules.rst
@@ -1,8 +1,7 @@
-ai-privacy-toolkit
-==================
+apt
+===
 
 .. toctree::
    :maxdepth: 4
 
    apt
-   tests
diff --git a/setup.cfg b/setup.cfg
index 2e79a5f..f478210 100644
--- a/setup.cfg
+++ b/setup.cfg
@@ -1,7 +1,7 @@
 [metadata]
 # replace with your username:
 name = ai-privacy-toolkit
-version = 0.0.4
+version = 0.1.0
 author = Abigail Goldsteen
 author_email = abigailt@il.ibm.com
 description = A toolkit for tools and techniques related to the privacy and compliance of AI models.

From 014aed96707c30ee95a68319edc77254f98f703d Mon Sep 17 00:00:00 2001
From: abigailgold <57357634+abigailgold@users.noreply.github.com>
Date: Sun, 1 May 2022 15:49:18 +0300
Subject: [PATCH 07/26] Update requirements (#28)

* Bump version to 0.1.0 (breaking changes to some APIs)
* Update documentation
* Update requirements
---
 requirements.txt | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/requirements.txt b/requirements.txt
index ec37771..e1133d4 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -2,7 +2,7 @@ numpy==1.21.0
 pandas==1.1.0
 scipy==1.4.1
 scikit-learn==0.22.2
-adversarial-robustness-toolkit>=1.9.1
+adversarial-robustness-toolbox>=1.10.1
 
 # testing
 pytest==5.4.2

From fd6be8e7782ba4672ec7554ea22ec681c1373d88 Mon Sep 17 00:00:00 2001
From: abigailgold <57357634+abigailgold@users.noreply.github.com>
Date: Mon, 2 May 2022 11:46:18 +0300
Subject: [PATCH 08/26] Documentation updates (#29)

* Bump version to 0.1.0 (breaking changes to some APIs)

* Update documentation

* Update requirements

* gitignore
---
 .gitignore                         | 160 ++++++++++++++++
 apt/anonymization/anonymizer.py    |  38 ++--
 apt/minimization/minimizer.py      | 199 +++++++++-----------
 apt/utils/dataset_utils.py         |  56 +++---
 apt/utils/datasets/datasets.py     | 285 ++++++++++++++++++++---------
 apt/utils/models/model.py          |  46 ++---
 apt/utils/models/sklearn_model.py  |  63 ++++---
 docs/conf.py                       |   7 +-
 docs/source/apt.utils.datasets.rst |  22 +++
 docs/source/apt.utils.models.rst   |  30 +++
 docs/source/apt.utils.rst          |  31 ++++
 requirements.txt                   |   1 +
 12 files changed, 640 insertions(+), 298 deletions(-)
 create mode 100644 .gitignore
 create mode 100644 docs/source/apt.utils.datasets.rst
 create mode 100644 docs/source/apt.utils.models.rst
 create mode 100644 docs/source/apt.utils.rst

diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..b0b6f3a
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,160 @@
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+cover/
+
+# Translations
+*.mo
+*.pot
+
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+
+# Flask stuff:
+instance/
+.webassets-cache
+
+# Scrapy stuff:
+.scrapy
+
+# Sphinx documentation
+docs/_build/
+
+# PyBuilder
+.pybuilder/
+target/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# IPython
+profile_default/
+ipython_config.py
+
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+
+# poetry
+#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
+#poetry.lock
+
+# pdm
+#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
+#pdm.lock
+#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
+#   in version control.
+#   https://pdm.fming.dev/#use-with-ide
+.pdm.toml
+
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# Pyre type checker
+.pyre/
+
+# pytype static type analyzer
+.pytype/
+
+# Cython debug symbols
+cython_debug/
+
+# PyCharm
+#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#  and can be added to the global gitignore or merged into this file.  For a more nuclear
+#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+.idea/
\ No newline at end of file
diff --git a/apt/anonymization/anonymizer.py b/apt/anonymization/anonymizer.py
index 02854f5..909cae7 100644
--- a/apt/anonymization/anonymizer.py
+++ b/apt/anonymization/anonymizer.py
@@ -19,27 +19,25 @@ class Anonymize:
 
     Based on the implementation described in: https://arxiv.org/abs/2007.13086
 
-    Parameters
-    ----------
-    k : int
-        The privacy parameter that determines the number of records that will be indistinguishable from each
-        other (when looking at the quasi identifiers). Should be at least 2.
-    quasi_identifiers : np.ndarray or list
-        The features that need to be minimized in case of pandas data, and indexes of features
-        in case of numpy data.
-    categorical_features : list, optional
-        The list of categorical features (should only be supplied when passing data as a
-        pandas dataframe.
-    is_regression : Bool, optional
-        Whether the model is a regression model or not (if False, assumes
-        a classification model). Default is False.
-    train_only_QI : Bool, optional
-        The required method to train data set for anonymization. Default is
-        to train the tree on all features.
+    :param k: The privacy parameter that determines the number of records that will be indistinguishable from each
+              other (when looking at the quasi identifiers). Should be at least 2.
+    :type k: int
+    :param quasi_identifiers: The features that need to be minimized in case of pandas data, and indexes of features
+                              in case of numpy data.
+    :type quasi_identifiers: np.ndarray or list
+    :param categorical_features: The list of categorical features (if supplied, these features will be one-hot encoded
+                                 before using them to train the decision tree model).
+    :type categorical_features: list, optional
+    :param is_regression: Whether the model is a regression model or not (if False, assumes a classification model).
+                          Default is False.
+    :type is_regression: boolean, optional
+    :param train_only_QI: The required method to train data set for anonymization. Default is
+                          to train the tree on all features.
+    :type train_only_QI: boolean, optional
     """
 
     def __init__(self, k: int, quasi_identifiers: Union[np.ndarray, list], categorical_features: Optional[list] = None,
-                 is_regression=False, train_only_QI=False):
+                 is_regression: Optional[bool] = False, train_only_QI: Optional[bool] = False):
         if k < 2:
             raise ValueError("k should be a positive integer with a value of 2 or higher")
         if quasi_identifiers is None or len(quasi_identifiers) < 1:
@@ -59,7 +57,9 @@ class Anonymize:
 
         :param dataset: Data wrapper containing the training data for the model and the predictions of the
                         original model on the training data.
-        :return: An array containing the anonymized training dataset.
+        :type dataset: `ArrayDataset`
+        :return: The anonymized training dataset as either numpy array or pandas DataFrame (depending on the type of
+                 the original data used to create the ArrayDataset).
         """
         if dataset.get_samples().shape[1] != 0:
             self.features = [i for i in range(dataset.get_samples().shape[1])]
diff --git a/apt/minimization/minimizer.py b/apt/minimization/minimizer.py
index 27b6b6e..7d538b0 100644
--- a/apt/minimization/minimizer.py
+++ b/apt/minimization/minimizer.py
@@ -21,7 +21,8 @@ from apt.utils.models import Model, SklearnRegressor, ModelOutputType, SklearnCl
 
 
 class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerMixin):
-    """ A transformer that generalizes data to representative points.
+    """
+    A transformer that generalizes data to representative points.
 
     Learns data generalizations based on an original model's predictions
     and a target accuracy. Once the generalizations are learned, can
@@ -34,52 +35,33 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
     need to supply an existing ``estimator`` to init.
     In summary, either ``estimator`` and ``target_accuracy`` should be
     supplied or ``cells`` should be supplied.
-    Parameters
-    ----------
-    estimator : estimator, optional
-        The original model for which generalization is being performed.
-        Should be pre-fitted.
-    target_accuracy : float, optional
-        The required accuracy when applying the base model to the
-        generalized data. Accuracy is measured relative to the original
-        accuracy of the model.
-    categorical_features: list of str, optional
-        The list of categorical features should only be supplied when
-         passing data as a pandas dataframe.
-    features_to_minimize: List of str or numbers, optional
-        The features that need to be minimized in case of pandas data,
-         and indexes of features in case of numpy data.
-    cells : list of object, optional
-        The cells used to generalize records. Each cell must define a
-        range or subset of categories for each feature, as well as a
-        representative value for each feature.
-        This parameter should be used when instantiating a transformer
-        object without first fitting it.
-    train_only_QI : Bool, optional
-        The required method to train data set for minimizing. Default is
-        to train the tree just on the features that are given as
-        features_to_minimize.
-    is_regression : Bool, optional
-        Whether the model is a regression model or not (if False, assumes
-        a classification model). Default is False.
 
-    Attributes
-    ----------
-    features_ : list of str
-        The feature names, in the order that they appear in the data.
-    cells_ : list of object
-        The cells used to generalize records, as learned when calling fit.
-    ncp_ : float
-        The NCP (information loss) score of the resulting generalization,
-        as measured on the training data.
-    generalizations_ : object
-        The generalizations that were learned (actual feature ranges).
+    :param estimator: The original model for which generalization is being performed. Should be pre-fitted.
+    :type estimator: sklearn `BaseEstimator` or `Model`
+    :param target_accuracy: The required relative accuracy when applying the base model to the generalized data.
+                            Accuracy is measured relative to the original accuracy of the model.
+    :type target_accuracy: float, optional
+    :param cells: The cells used to generalize records. Each cell must define a range or subset of categories for
+                  each feature, as well as a representative value for each feature. This parameter should be used
+                  when instantiating a transformer object without first fitting it.
+    :type cells: list of objects, optional
+    :param categorical_features: The list of categorical features (if supplied, these features will be one-hot
+                                 encoded before using them to train the decision tree model).
+    :type categorical_features: list of strings, optional
+    :param features_to_minimize: The features to be minimized.
+    :type features_to_minimize: list of strings or int, optional
+    :param train_only_QI: Whether to train the tree just on the ``features_to_minimize`` or on all features. Default
+                          is only on ``features_to_minimize``.
+    :type train_only_QI: boolean, optional
+    :param is_regression: Whether the model is a regression model or not (if False, assumes a classification model).
+                          Default is False.
+    :type is_regression: boolean, optional
     """
 
-    def __init__(self, estimator: Union[BaseEstimator, Model] = None, target_accuracy: float = 0.998,
-                 cells: list = None, categorical_features: Union[np.ndarray, list] = None,
-                 features_to_minimize: Union[np.ndarray, list] = None, train_only_QI: bool = True,
-                 is_regression: bool = False):
+    def __init__(self, estimator: Union[BaseEstimator, Model] = None, target_accuracy: Optional[float] = 0.998,
+                 cells: Optional[list] = None, categorical_features: Optional[Union[np.ndarray, list]] = None,
+                 features_to_minimize: Optional[Union[np.ndarray, list]] = None, train_only_QI: Optional[bool] = True,
+                 is_regression: Optional[bool] = False):
         if issubclass(estimator.__class__, Model):
             self.estimator = estimator
         else:
@@ -97,18 +79,13 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         self.is_regression = is_regression
 
     def get_params(self, deep=True):
-        """Get parameters for this estimator.
+        """
+        Get parameters
 
-        Parameters
-        ----------
-        deep : boolean, optional
-            If True, will return the parameters for this estimator and contained
-            subobjects that are estimators.
-
-        Returns
-        -------
-        params : mapping of string to any
-            Parameter names mapped to their values.
+        :param deep: If True, will return the parameters for this estimator and contained
+                     sub-objects that are estimators.
+        :type deep: boolean, optional
+        :return: Parameter names mapped to their values
         """
         ret = {}
         ret['target_accuracy'] = self.target_accuracy
@@ -120,12 +97,17 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         return ret
 
     def set_params(self, **params):
-        """Set the parameters of this estimator.
+        """
+        Set parameters
 
-        Returns
-        -------
-        self : object
-            Returns self.
+        :param target_accuracy: The required relative accuracy when applying the base model to the generalized data.
+                                Accuracy is measured relative to the original accuracy of the model.
+        :type target_accuracy: float, optional
+        :param cells: The cells used to generalize records. Each cell must define a range or subset of categories for
+                      each feature, as well as a representative value for each feature. This parameter should be used
+                      when instantiating a transformer object without first fitting it.
+        :type cells: list of objects, optional
+        :return: self
         """
         if 'target_accuracy' in params:
             self.target_accuracy = params['target_accuracy']
@@ -135,29 +117,32 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
     @property
     def generalizations(self):
+        """
+        Return the generalizations derived from the model and test data.
+
+        :return: generalizations object. Contains 3 sections: 'ranges' that contains ranges for numerical features,
+                                 'categories' that contains sub-groups of categories for categorical features, and
+                                 'untouched' that contains the features that could not be generalized.
+        """
         return self.generalizations_
 
     def fit_transform(self, X: Optional[DATA_PANDAS_NUMPY_TYPE] = None, y: Optional[DATA_PANDAS_NUMPY_TYPE] = None,
-                      features_names: Optional = None, dataset: Optional[ArrayDataset] = None):
-        """Learns the generalizations based on training data, and applies them to the data.
+                      features_names: Optional[list] = None, dataset: Optional[ArrayDataset] = None):
+        """
+        Learns the generalizations based on training data, and applies them to the data.
 
-        Parameters
-        ----------
-        X : {array-like, sparse matrix}, shape (n_samples, n_features), optional
-            The training input samples.
-        y : array-like, shape (n_samples,), optional
-            The target values. An array of int.
-            This should contain the predictions of the original model on ``X``.
-        features_names : list of str, The feature names, in the order that they appear in the data,
-                        provided just if X and y were provided (optional).
-        dataset : Data wrapper containing the training input samples and the predictions of the
-                  original model on the training data.
-        Either X,y OR dataset need to be provided, not both.
-        Returns
-        -------
-        X_transformed : numpy or pandas according to the input type, shape (n_samples, n_features)
-            The array containing the representative values to which each record in
-            ``X`` is mapped.
+        :param X: The training input samples.
+        :type X: {array-like, sparse matrix}, shape (n_samples, n_features), optional
+        :param y: The target values. This should contain the predictions of the original model on ``X``.
+        :type y: array-like, shape (n_samples,), optional
+        :param features_names: The feature names, in the order that they appear in the data. Can be provided when
+                               passing the data as ``X`` and ``y``
+        :type features_names: list of strings, optional
+        :param dataset: Data wrapper containing the training input samples and the predictions of the original model
+                        on the training data. Either ``X``, ``y`` OR ``dataset`` need to be provided, not both.
+        :type dataset: `ArrayDataset`, optional
+        :return: Array containing the representative values to which each record in ``X`` is mapped, as numpy array or
+                 pandas DataFrame (depending on the type of ``X``), shape (n_samples, n_features)
         """
         self.fit(X, y, features_names, dataset=dataset)
         return self.transform(X, features_names, dataset=dataset)
@@ -166,23 +151,17 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             features_names: Optional = None, dataset: ArrayDataset = None):
         """Learns the generalizations based on training data.
 
-        Parameters
-        ----------
-        X : {array-like, sparse matrix}, shape (n_samples, n_features), optional
-            The training input samples.
-        y : array-like, shape (n_samples,), optional
-            The target values. An array of int.
-            This should contain the predictions of the original model on ``X``.
-        features_names : list of str, The feature names, in the order that they appear in the data,
-                        provided just if X and y were provided (optional).
-        dataset : Data wrapper containing the training input samples and the predictions of the
-                  original model on the training data.
-        Either X,y OR dataset need to be provided, not both.
-        Returns
-        -------
-        X_transformed : numpy or pandas according to the input type, shape (n_samples, n_features)
-            The array containing the representative values to which each record in
-            ``X`` is mapped.
+        :param X: The training input samples.
+        :type X: {array-like, sparse matrix}, shape (n_samples, n_features), optional
+        :param y: The target values. This should contain the predictions of the original model on ``X``.
+        :type y: array-like, shape (n_samples,), optional
+        :param features_names: The feature names, in the order that they appear in the data. Can be provided when
+                               passing the data as ``X`` and ``y``
+        :type features_names: list of strings, optional
+        :param dataset: Data wrapper containing the training input samples and the predictions of the original model
+                        on the training data. Either ``X``, ``y`` OR ``dataset`` need to be provided, not both.
+        :type dataset: `ArrayDataset`, optional
+        :return: self
         """
 
         # take into account that estimator, X, y, cells, features may be None
@@ -242,7 +221,6 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 used_X_train = X_train_QI
 
             # collect feature data (such as min, max)
-
             feature_data = {}
             for feature in self._features:
                 if feature not in feature_data.keys():
@@ -386,23 +364,20 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         # Return the transformer
         return self
 
-    def transform(self, X: Optional[DATA_PANDAS_NUMPY_TYPE] = None, features_names: Optional = None, dataset: ArrayDataset = None):
+    def transform(self, X: Optional[DATA_PANDAS_NUMPY_TYPE] = None, features_names: Optional[list] = None,
+                  dataset: Optional[ArrayDataset] = None):
         """ Transforms data records to representative points.
 
-        Parameters
-        ----------
-        X : {array-like, sparse-matrix}, shape (n_samples, n_features), If provided as a pandas dataframe,
-         may contain both numeric and categorical data.
-            The input samples.
-        features_names : list of str, The feature names, in the order that they appear in the data,
-                        provided just if X was provided (optional).
-        dataset : Data wrapper containing the training input samples.
-        Either X OR dataset need to be provided, not both.
-        Returns
-        -------
-        X_transformed : numpy or pandas according to the input type, shape (n_samples, n_features)
-            The array containing the representative values to which each record in
-            ``X`` is mapped.
+        :param X: The input samples.
+        :type X: {array-like, sparse matrix}, shape (n_samples, n_features), optional
+        :param features_names: The feature names, in the order that they appear in the data. Can be provided when
+                               passing the data as ``X``
+        :type features_names: list of strings, optional
+        :param dataset: Data wrapper containing the input samples. Either ``X`` OR ``dataset`` needs to be provided,
+                        not both.
+        :type dataset: `ArrayDataset`, optional
+        :return: Array containing the representative values to which each record in ``X`` is mapped, as numpy array or
+                 pandas DataFrame (depending on the type of ``X``), shape (n_samples, n_features)
         """
 
         # Check if fit has been called
diff --git a/apt/utils/dataset_utils.py b/apt/utils/dataset_utils.py
index e3eb959..e395717 100644
--- a/apt/utils/dataset_utils.py
+++ b/apt/utils/dataset_utils.py
@@ -6,6 +6,17 @@ from os import path, mkdir
 from six.moves.urllib.request import urlretrieve
 
 
+def get_iris_dataset(test_set: float = 0.3):
+    """
+    Loads the Iris dataset from scikit-learn.
+
+    :param test_set: Proportion of the data to use as validation split (value between 0 and 1). Default is 0.3
+    :type test_set: float
+    :return: Entire dataset and labels as numpy arrays. Returned as a tuple (x_train, y_train), (x_test, y_test)
+    """
+    return _load_iris(test_set)
+
+
 def _load_iris(test_set_size: float = 0.3):
     iris = datasets.load_iris()
     data = iris.data
@@ -18,14 +29,15 @@ def _load_iris(test_set_size: float = 0.3):
     return (x_train, y_train), (x_test, y_test)
 
 
-def get_iris_dataset(test_set: float = 0.3):
+def get_diabetes_dataset(test_set: float = 0.3):
     """
-    Loads the Iris dataset from scikit-learn.
+    Loads the Diabetes dataset from scikit-learn.
 
-    :param test_set: Proportion of the data to use as validation split (value between 0 and 1).
-    :return: Entire dataset and labels as numpy array.
+    :param test_set: Proportion of the data to use as validation split (value between 0 and 1). Default is 0.3
+    :type test_set: float
+    :return: Entire dataset and labels as numpy arrays. Returned as a tuple (x_train, y_train), (x_test, y_test)
     """
-    return _load_iris(test_set)
+    return _load_diabetes(test_set)
 
 
 def _load_diabetes(test_set_size: float = 0.3):
@@ -40,22 +52,14 @@ def _load_diabetes(test_set_size: float = 0.3):
     return (x_train, y_train), (x_test, y_test)
 
 
-def get_diabetes_dataset():
-    """
-    Loads the Iris dataset from scikit-learn.
-
-    :param test_set: Proportion of the data to use as validation split (value between 0 and 1).
-    :return: Entire dataset and labels as numpy array.
-    """
-    return _load_diabetes()
-
-
 def get_german_credit_dataset(test_set: float = 0.3):
     """
-    Loads the UCI German_credit dataset from `tests/datasets/german` or downloads it if necessary.
+    Loads the UCI German credit dataset from `tests/datasets/german` or downloads it from
+    https://archive.ics.uci.edu/ml/machine-learning-databases/statlog/german/ if necessary.
 
-    :param test_set: Proportion of the data to use as validation split (value between 0 and 1).
-    :return: Dataset and labels as pandas dataframes.
+    :param test_set: Proportion of the data to use as validation split (value between 0 and 1). Default is 0.3
+    :type test_set: float
+    :return: Dataset and labels as pandas dataframes. Returned as a tuple (x_train, y_train), (x_test, y_test)
     """
 
     url = 'https://archive.ics.uci.edu/ml/machine-learning-databases/statlog/german/german.data'
@@ -124,9 +128,10 @@ def _modify_german_dataset(data):
 
 def get_adult_dataset():
     """
-    Loads the UCI Adult dataset from `tests/datasets/adult` or downloads it if necessary.
+    Loads the UCI Adult dataset from `tests/datasets/adult` or downloads it from
+    https://archive.ics.uci.edu/ml/machine-learning-databases/adult/ if necessary.
 
-    :return: Dataset and labels as pandas dataframes.
+    :return: Dataset and labels as pandas dataframes. Returned as a tuple (x_train, y_train), (x_test, y_test)
     """
     features = ['age', 'workclass', 'fnlwgt', 'education', 'education-num', 'marital-status', 'occupation',
                 'relationship', 'race', 'sex', 'capital-gain', 'capital-loss', 'hours-per-week', 'native-country',
@@ -225,15 +230,20 @@ def _modify_adult_dataset(data):
 
 def get_nursery_dataset(raw: bool = True, test_set: float = 0.2, transform_social: bool = False):
     """
-    Loads the UCI Nursery dataset from `tests/datasets/nursery` or downloads it if necessary.
+    Loads the UCI Nursery dataset from `tests/datasets/nursery` or downloads it from
+    https://archive.ics.uci.edu/ml/machine-learning-databases/nursery/ if necessary.
 
     :param raw: `True` if no preprocessing should be applied to the data. Otherwise, categorical data is one-hot
                 encoded and data is scaled using sklearn's StandardScaler.
-    :param test_set: Proportion of the data to use as validation split. The value should be between 0 and 1.
+    :type raw: boolean
+    :param test_set: Proportion of the data to use as validation split. The value should be between 0 and 1. Default is
+                     0.2
+    :type test_set: float
     :param transform_social: If `True`, transforms the social feature to be binary for the purpose of attribute
                              inference. This is done by assigning the original value 'problematic' the new value 1, and
                              the other original values are assigned the new value 0.
-    :return: Dataset and labels as pandas dataframes.
+    :type transform_social: boolean
+    :return: Dataset and labels as pandas dataframes. Returned as a tuple (x_train, y_train), (x_test, y_test)
     """
     url = 'https://archive.ics.uci.edu/ml/machine-learning-databases/nursery/nursery.data'
     data_dir = '../datasets/nursery'
diff --git a/apt/utils/datasets/datasets.py b/apt/utils/datasets/datasets.py
index ff7c296..9383a2f 100644
--- a/apt/utils/datasets/datasets.py
+++ b/apt/utils/datasets/datasets.py
@@ -24,41 +24,6 @@ OUTPUT_DATA_ARRAY_TYPE = np.ndarray
 DATA_PANDAS_NUMPY_TYPE = Union[np.ndarray, pd.DataFrame]
 
 
-def array2numpy(self, arr: INPUT_DATA_ARRAY_TYPE) -> OUTPUT_DATA_ARRAY_TYPE:
-
-    """
-    converts from INPUT_DATA_ARRAY_TYPE to numpy array
-    """
-    if type(arr) == np.ndarray:
-        return arr
-    if type(arr) == pd.DataFrame or type(arr) == pd.Series:
-        self.is_pandas = True
-        return arr.to_numpy()
-    if isinstance(arr, list):
-        return np.array(arr)
-    if type(arr) == Tensor:
-        return arr.detach().cpu().numpy()
-
-    raise ValueError('Non supported type: ', type(arr).__name__)
-
-
-def array2torch_tensor(self, arr: INPUT_DATA_ARRAY_TYPE) -> Tensor:
-    """
-    converts from INPUT_DATA_ARRAY_TYPE to torch tensor array
-    """
-    if type(arr) == np.ndarray:
-        return torch.from_numpy(arr)
-    if type(arr) == pd.DataFrame or type(arr) == pd.Series:
-        self.is_pandas = True
-        return torch.from_numpy(arr.to_numpy())
-    if isinstance(arr, list):
-        return torch.tensor(arr)
-    if type(arr) == Tensor:
-        return arr
-
-    raise ValueError('Non supported type: ', type(arr).__name__)
-
-
 class Dataset(metaclass=ABCMeta):
     """Base Abstract Class for Dataset"""
 
@@ -68,36 +33,99 @@ class Dataset(metaclass=ABCMeta):
 
     @abstractmethod
     def get_samples(self) -> Collection[Any]:
-        """Return data samples"""
+        """
+        Return data samples
+
+        :return: the data samples
+        """
         pass
 
     @abstractmethod
     def get_labels(self) -> Collection[Any]:
-        """Return labels"""
+        """
+        Return labels
+
+        :return: the labels
+        """
         pass
 
+    def _array2numpy(self, arr: INPUT_DATA_ARRAY_TYPE) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Converts from INPUT_DATA_ARRAY_TYPE to numpy array
+
+        :param arr: the array to transform
+        :type arr: numpy array or pandas DataFrame or list or pytorch Tensor
+        :return: the array transformed into a numpy array
+        """
+        if type(arr) == np.ndarray:
+            return arr
+        if type(arr) == pd.DataFrame or type(arr) == pd.Series:
+            self.is_pandas = True
+            return arr.to_numpy()
+        if isinstance(arr, list):
+            return np.array(arr)
+        if type(arr) == Tensor:
+            return arr.detach().cpu().numpy()
+
+        raise ValueError('Non supported type: ', type(arr).__name__)
+
+    def _array2torch_tensor(self, arr: INPUT_DATA_ARRAY_TYPE) -> Tensor:
+        """
+        Converts from INPUT_DATA_ARRAY_TYPE to torch tensor array
+
+        :param arr: the array to transform
+        :type arr: numpy array or pandas DataFrame or list or pytorch Tensor
+        :return: the array transformed into a pytorch Tensor
+        """
+        if type(arr) == np.ndarray:
+            return torch.from_numpy(arr)
+        if type(arr) == pd.DataFrame or type(arr) == pd.Series:
+            self.is_pandas = True
+            return torch.from_numpy(arr.to_numpy())
+        if isinstance(arr, list):
+            return torch.tensor(arr)
+        if type(arr) == Tensor:
+            return arr
+
+        raise ValueError('Non supported type: ', type(arr).__name__)
+
 
 class StoredDataset(Dataset):
-    """Abstract Class for Storable Dataset"""
+    """Abstract Class for a Dataset that can be downloaded from a URL and stored in a file"""
 
     @abstractmethod
     def load_from_file(self, path: str):
-        """Load dataset from file"""
+        """
+        Load dataset from file
+
+        :param path: the path to the file
+        :type path: string
+        :return: None
+        """
         pass
 
     @abstractmethod
     def load(self, **kwargs):
-        """Load dataset"""
+        """
+        Load dataset
+
+        :return: None
+        """
         pass
 
     @staticmethod
-    def download(url: str, dest_path: str, filename: str, unzip: bool = False) -> None:
+    def download(url: str, dest_path: str, filename: str, unzip: Optional[bool] = False) -> None:
         """
         Download the dataset from URL
+
         :param url: dataset URL, the dataset will be requested from this URL
+        :type url: string
         :param dest_path: local dataset destination path
+        :type dest_path: string
         :param filename: local dataset filename
-        :param unzip: flag whether or not perform extraction
+        :type filename: string
+        :param unzip: flag indicating whether or not to perform extraction. Default is False.
+        :type unzip: boolean, optional
         :return: None
         """
         file_path = os.path.join(dest_path, filename)
@@ -115,12 +143,16 @@ class StoredDataset(Dataset):
             StoredDataset.extract_archive(zip_path=file_path, dest_path=dest_path, remove_archive=False)
 
     @staticmethod
-    def extract_archive(zip_path: str, dest_path=None, remove_archive=False):
+    def extract_archive(zip_path: str, dest_path: Optional[str] = None, remove_archive: Optional[bool] = False):
         """
         Extract dataset from archived file
+
         :param zip_path: path to archived file
+        :type zip_path: string
         :param dest_path: directory path to uncompress the file to
-        :param remove_archive: whether remove the archive file after uncompress (default False)
+        :type dest_path: string, optional
+        :param remove_archive: whether to remove the archive file after uncompressing. Default is False.
+        :type remove_archive: boolean, optional
         :return: None
         """
         logger.info("Extracting the dataset...")
@@ -134,15 +166,23 @@ class StoredDataset(Dataset):
         logger.info("Extracted the dataset")
 
     @staticmethod
-    def split_debug(datafile: str, dest_datafile: str, ratio: int, shuffle=True, delimiter=",", fmt=None) -> None:
+    def split_debug(datafile: str, dest_datafile: str, ratio: int, shuffle: Optional[bool] = True,
+                    delimiter: Optional[str] = ",", fmt: Optional[Union[str, list]] = None) -> None:
         """
         Split the data and take only a part of it
+
         :param datafile: dataset file path
+        :type datafile: string
         :param dest_datafile: destination path for the partial dataset file
+        :type dest_datafile: string
         :param ratio: part of the dataset to save
-        :param shuffle: whether to shuffle the data or not (default True)
-        :param delimiter: dataset delimiter (default ",")
-        :param fmt: format for the correct data saving
+        :type ratio: int
+        :param shuffle: whether to shuffle the data or not. Default is True.
+        :type shuffle: boolean, optional
+        :param delimiter: dataset delimiter. Default is ","
+        :type delimiter: string, optional
+        :param fmt: format for the correct data saving. As defined by numpy.savetxt(). Default is None.
+        :type fmt: string or sequence of strings, optional
         :return: None
         """
         if os.path.isfile(dest_datafile):
@@ -162,21 +202,23 @@ class StoredDataset(Dataset):
 
 
 class ArrayDataset(Dataset):
-    """Dataset that is based on x and y arrays (e.g., numpy/pandas/list...)"""
+    """
+    Dataset that is based on x and y arrays (e.g., numpy/pandas/list...)
+
+    :param x: collection of data samples
+    :type x: numpy array or pandas DataFrame or list or pytorch Tensor
+    :param y: collection of labels
+    :type y: numpy array or pandas DataFrame or list or pytorch Tensor, optional
+    :param features_names: The feature names, in the order that they appear in the data
+    :type features_names: list of strings, optional
+    """
 
     def __init__(self, x: INPUT_DATA_ARRAY_TYPE, y: Optional[INPUT_DATA_ARRAY_TYPE] = None,
-                 features_names: Optional = None, **kwargs):
-        """
-        ArrayDataset constructor.
-        :param x: collection of data samples
-        :param y: collection of labels (optional)
-        :param feature_names: list of str, The feature names, in the order that they appear in the data (optional)
-        :param kwargs: dataset parameters
-        """
+                 features_names: Optional[list] = None, **kwargs):
         self.is_pandas = False
         self.features_names = features_names
-        self._y = array2numpy(self, y) if y is not None else None
-        self._x = array2numpy(self, x)
+        self._y = self._array2numpy(y) if y is not None else None
+        self._x = self._array2numpy(x)
         if self.is_pandas:
             if features_names and not np.array_equal(features_names, x.columns):
                 raise ValueError("The supplied features are not the same as in the data features")
@@ -186,51 +228,80 @@ class ArrayDataset(Dataset):
             raise ValueError('Non equivalent lengths of x and y')
 
     def get_samples(self) -> OUTPUT_DATA_ARRAY_TYPE:
-        """Return data samples as numpy array"""
+        """
+        Get data samples
+
+        :return: data samples as numpy array
+        """
         return self._x
 
     def get_labels(self) -> OUTPUT_DATA_ARRAY_TYPE:
-        """Return labels as numpy array"""
+        """
+        Get labels
+
+        :return: labels as numpy array
+        """
         return self._y
 
 
 class PytorchData(Dataset):
+    """
+    Dataset for pytorch models.
 
+    :param x: collection of data samples
+    :type x: numpy array or pandas DataFrame or list or pytorch Tensor
+    :param y: collection of labels
+    :type y: numpy array or pandas DataFrame or list or pytorch Tensor, optional
+    """
     def __init__(self, x: INPUT_DATA_ARRAY_TYPE, y: Optional[INPUT_DATA_ARRAY_TYPE] = None, **kwargs):
-        """
-        PytorchData constructor.
-        :param x: collection of data samples
-        :param y: collection of labels (optional)
-        :param kwargs: dataset parameters
-        """
         self.is_pandas = False
-        self._y = array2torch_tensor(self, y) if y is not None else None
-        self._x = array2torch_tensor(self, x)
+        self._y = self._array2torch_tensor(y) if y is not None else None
+        self._x = self._array2torch_tensor(x)
         if self.is_pandas:
             self.features_names = x.columns
 
         if y is not None and len(self._x) != len(self._y):
             raise ValueError('Non equivalent lengths of x and y')
 
-
         if self._y is not None:
             self.__getitem__ = self.get_item
         else:
             self.__getitem__ = self.get_sample_item
 
-
     def get_samples(self) -> OUTPUT_DATA_ARRAY_TYPE:
-        """Return data samples as numpy array"""
-        return array2numpy(self._x)
+        """
+        Get data samples.
+
+        :return: samples as numpy array
+        """
+        return self._array2numpy(self._x)
 
     def get_labels(self) -> OUTPUT_DATA_ARRAY_TYPE:
-        """Return labels as numpy array"""
-        return array2numpy(self._y) if self._y is not None else None
+        """
+        Get labels.
 
-    def get_sample_item(self, idx) -> Tensor:
+        :return: labels as numpy array
+        """
+        return self._array2numpy(self._y) if self._y is not None else None
+
+    def get_sample_item(self, idx: int) -> Tensor:
+        """
+        Get the sample according to the given index
+
+        :param idx: the index of the sample to return
+        :type idx: int
+        :return: the sample as a pytorch Tensor
+        """
         return self.x[idx]
 
-    def get_item(self, idx) -> Tensor:
+    def get_item(self, idx: int) -> Tensor:
+        """
+        Get the sample and label according to the given index
+
+        :param idx: the index of the sample to return
+        :type idx: int
+        :return: the sample and label as pytorch Tensors. Returned as a tuple (sample, label)
+        """
         sample, label = self.x[idx], self.y[idx]
         return sample, label
 
@@ -246,8 +317,10 @@ class DatasetFactory:
     def register(cls, name: str) -> Callable:
         """
         Class method to register Dataset to the internal registry
+
         :param name: dataset name
-        :return:
+        :type name: string
+        :return: a Callable that returns the registered dataset class
         """
 
         def inner_wrapper(wrapped_class: Dataset) -> Any:
@@ -262,11 +335,15 @@ class DatasetFactory:
     def create_dataset(cls, name: str, **kwargs) -> Dataset:
         """
         Factory command to create dataset instance.
+
         This method gets the appropriate Dataset class from the registry
         and creates an instance of it, while passing in the parameters
         given in ``kwargs``.
+
         :param name: The name of the dataset to create.
+        :type name: string
         :param kwargs: dataset parameters
+        :type kwargs: keyword arguments as expected by the class
         :return: An instance of the dataset that is created.
         """
         if name not in cls.registry:
@@ -280,13 +357,19 @@ class DatasetFactory:
 
 
 class Data:
-    def __init__(self, train: Dataset = None, test: Dataset = None, **kwargs):
+    """
+    Class for storing train and test datasets.
+
+    :param train: the training set
+    :type train: `Dataset`, optional
+    :param test: the test set
+    :type test: `Dataset`, optional
+    """
+    def __init__(self, train: Dataset = None, test: Optional[Dataset] = None, **kwargs):
         """
         Data class constructor.
-        The class stores train and test datasets.
-        If neither of the datasets was provided,
-        Both train and test datasets will be create using
-        DatasetFactory to create a dataset instance
+
+        If neither of the datasets was provided, both train and test datasets will be created using `DatasetFactory`.
         """
         if train or test:
             self.train = train
@@ -296,25 +379,49 @@ class Data:
             self.test = DatasetFactory.create_dataset(train=False, **kwargs)
 
     def get_train_set(self) -> Dataset:
-        """Return train DatasetBase"""
+        """
+        Get training set
+
+        :return: training `Dataset`
+        """
         return self.train
 
     def get_test_set(self) -> Dataset:
-        """Return test DatasetBase"""
+        """
+        Get test set
+
+        :return: test `Dataset`
+        """
         return self.test
 
     def get_train_samples(self) -> Collection[Any]:
-        """Return train set samples"""
+        """
+        Get train set samples
+
+        :return: training samples
+        """
         return self.train.get_samples()
 
     def get_train_labels(self) -> Collection[Any]:
-        """Return train set labels"""
+        """
+        Get train set labels
+
+        :return: training labels
+        """
         return self.train.get_labels()
 
     def get_test_samples(self) -> Collection[Any]:
-        """Return test set samples"""
+        """
+        Get test set samples
+
+        :return: test samples
+        """
         return self.test.get_samples()
 
     def get_test_labels(self) -> Collection[Any]:
-        """Return test set labels"""
+        """
+        Get test set labels
+
+        :return: test labels
+        """
         return self.test.get_labels()
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index 9616459..c362fb5 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -14,24 +14,25 @@ class ModelOutputType(Enum):
 class Model(metaclass=ABCMeta):
     """
     Abstract base class for ML model wrappers.
+
+    :param model: The original model object (of the underlying ML framework)
+    :type model: framework-specific model object
+    :param output_type: The type of output the model yields (vector/label only for classifiers,
+                        value for regressors)
+    :type output_type: `ModelOutputType`
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Set to True if the model is only available via query (API) access, i.e.,
+                             only the outputs of the model are exposed, and False if the model internals
+                             are also available. Default is True.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                              unlimited queries to the model API or whether there is a limit to the number of
+                              queries that can be submitted. Default is True.
+    :type unlimited_queries: boolean, optional
     """
 
     def __init__(self, model: Any, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
                  unlimited_queries: Optional[bool] = True, **kwargs):
-        """
-        Initialize a `Model` wrapper object.
-
-        :param model: The original model object (of the underlying ML framework)
-        :param output_type: The type of output the model yields (vector/label only for classifiers,
-                            value for regressors)
-        :param black_box_access: Boolean describing the type of deployment of the model (when in production).
-                                 Set to True if the model is only available via query (API) access, i.e.,
-                                 only the outputs of the model are exposed, and False if the model internals
-                                 are also available. Optional, Default is True.
-        :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
-                                  unlimited queries to the model API or whether there is a limit to the number of
-                                  queries that can be submitted. Optional, Default is True.
-        """
         self._model = model
         self._output_type = output_type
         self._black_box_access = black_box_access
@@ -54,7 +55,7 @@ class Model(metaclass=ABCMeta):
 
         :param x: Input samples.
         :type x: `np.ndarray` or `pandas.DataFrame`
-        :return: Predictions from the model.
+        :return: Predictions from the model as numpy array.
         """
         raise NotImplementedError
 
@@ -65,13 +66,14 @@ class Model(metaclass=ABCMeta):
 
         :param test_data: Test data.
         :type train_data: `Dataset`
+        :return: the score as float (for classifiers, between 0 and 1)
         """
         return NotImplementedError
 
     @property
     def model(self) -> Any:
         """
-        Return the model.
+        Return the underlying model.
 
         :return: The model.
         """
@@ -89,21 +91,19 @@ class Model(metaclass=ABCMeta):
     @property
     def black_box_access(self) -> bool:
         """
-        Return True if the model is only available via query (API) access, i.e.,
-        only the outputs of the model are exposed, and False if the model internals are also available.
+        Return whether the model is only available via query (API) access, i.e.,
+        only the outputs of the model are exposed, or if the model internals are also available.
 
-        :return: True if the model is only available via query (API) access, i.e.,
-                 only the outputs of the model are exposed, and False if the model internals are also available.
+        :return: True if the model is only available via query (API) access, otherwise False.
         """
         return self._black_box_access
 
     @property
     def unlimited_queries(self) -> bool:
         """
-        If black_box_access is True, Return whether a user can perform unlimited queries to the model API
+        If black_box_access is True, return whether a user can perform unlimited queries to the model API
         or whether there is a limit to the number of queries that can be submitted.
 
-        :return: If black_box_access is True, Return whether a user can perform unlimited queries to the model API
-                 or whether there is a limit to the number of queries that can be submitted.
+        :return: True if a user can perform unlimited queries to the model API, otherwise False.
         """
         return self._unlimited_queries
diff --git a/apt/utils/models/sklearn_model.py b/apt/utils/models/sklearn_model.py
index f7afaa6..a64058e 100644
--- a/apt/utils/models/sklearn_model.py
+++ b/apt/utils/models/sklearn_model.py
@@ -22,6 +22,7 @@ class SklearnModel(Model):
 
         :param test_data: Test data.
         :type train_data: `Dataset`
+        :return: the score as float (for classifiers, between 0 and 1)
         """
         return self.model.score(test_data.get_samples(), test_data.get_labels(), **kwargs)
 
@@ -29,23 +30,23 @@ class SklearnModel(Model):
 class SklearnClassifier(SklearnModel):
     """
     Wrapper class for scikitlearn classification models.
+
+    :param model: The original sklearn model object.
+    :type model: scikitlearn classifier object
+    :param output_type: The type of output the model yields (vector/label only)
+    :type output_type: `ModelOutputType`
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Set to True if the model is only available via query (API) access, i.e.,
+                             only the outputs of the model are exposed, and False if the model internals
+                             are also available. Default is True.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                              unlimited queries to the model API or whether there is a limit to the number of
+                              queries that can be submitted. Default is True.
+    :type unlimited_queries: boolean, optional
     """
     def __init__(self, model: BaseEstimator, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
                  unlimited_queries: Optional[bool] = True, **kwargs):
-        """
-        Initialize a `SklearnClassifier` wrapper object.
-
-        :param model: The original sklearn model object.
-        :param output_type: The type of output the model yields (vector/label only for classifiers,
-                            value for regressors)
-        :param black_box_access: Boolean describing the type of deployment of the model (when in production).
-                                 Set to True if the model is only available via query (API) access, i.e.,
-                                 only the outputs of the model are exposed, and False if the model internals
-                                 are also available. Optional, Default is True.
-        :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
-                                  unlimited queries to the model API or whether there is a limit to the number of
-                                  queries that can be submitted. Optional, Default is True.
-        """
         super().__init__(model, output_type, black_box_access, unlimited_queries, **kwargs)
         self._art_model = ArtSklearnClassifier(model)
 
@@ -55,6 +56,7 @@ class SklearnClassifier(SklearnModel):
 
         :param train_data: Training data.
         :type train_data: `Dataset`
+        :return: None
         """
         encoder = OneHotEncoder(sparse=False)
         y_encoded = encoder.fit_transform(train_data.get_labels().reshape(-1, 1))
@@ -65,8 +67,8 @@ class SklearnClassifier(SklearnModel):
         Perform predictions using the model for input `x`.
 
         :param x: Input samples.
-        :type x: `np.ndarray` or `pandas.DataFrame`
-        :return: Predictions from the model (class probabilities, if supported).
+        :type x: `Dataset`
+        :return: Predictions from the model as numpy array (class probabilities, if supported).
         """
         return self._art_model.predict(x, **kwargs)
 
@@ -74,21 +76,21 @@ class SklearnClassifier(SklearnModel):
 class SklearnRegressor(SklearnModel):
     """
     Wrapper class for scikitlearn regression models.
+
+    :param model: The original sklearn model object.
+    :type model: scikitlearn regressor object
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Set to True if the model is only available via query (API) access, i.e.,
+                             only the outputs of the model are exposed, and False if the model internals
+                             are also available. Default is True.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                              unlimited queries to the model API or whether there is a limit to the number of
+                              queries that can be submitted. Default is True.
+    :type unlimited_queries: boolean, optional
     """
     def __init__(self, model: BaseEstimator, black_box_access: Optional[bool] = True,
                  unlimited_queries: Optional[bool] = True, **kwargs):
-        """
-        Initialize a `SklearnRegressor` wrapper object.
-
-        :param model: The original sklearn model object.
-        :param black_box_access: Boolean describing the type of deployment of the model (when in production).
-                                 Set to True if the model is only available via query (API) access, i.e.,
-                                 only the outputs of the model are exposed, and False if the model internals
-                                 are also available. Optional, Default is True.
-        :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
-                                  unlimited queries to the model API or whether there is a limit to the number of
-                                  queries that can be submitted. Optional, Default is True.
-        """
         super().__init__(model, ModelOutputType.REGRESSOR_SCALAR, black_box_access, unlimited_queries, **kwargs)
         self._art_model = ScikitlearnRegressor(model)
 
@@ -98,6 +100,7 @@ class SklearnRegressor(SklearnModel):
 
         :param train_data: Training data.
         :type train_data: `Dataset`
+        :return: None
         """
         self._art_model.fit(train_data.get_samples(), train_data.get_labels(), **kwargs)
 
@@ -106,7 +109,7 @@ class SklearnRegressor(SklearnModel):
         Perform predictions using the model for input `x`.
 
         :param x: Input samples.
-        :type x: `np.ndarray` or `pandas.DataFrame`
-        :return: Predictions from the model.
+        :type x: `Dataset`
+        :return: Predictions from the model as numpy array.
         """
         return self._art_model.predict(x, **kwargs)
diff --git a/docs/conf.py b/docs/conf.py
index 6452871..6c49482 100644
--- a/docs/conf.py
+++ b/docs/conf.py
@@ -32,8 +32,11 @@ master_doc = 'index'
 # extensions coming with Sphinx (named 'sphinx.ext.*') or your custom
 # ones.
 extensions = [
+    'sphinx.ext.duration',
+    'sphinx.ext.doctest',
     'sphinx.ext.autodoc',
-    'sphinx.ext.napoleon'
+    'sphinx.ext.autosummary',
+    'sphinx.ext.intersphinx',
 ]
 
 # Add any paths that contain templates here, relative to this directory.
@@ -50,7 +53,7 @@ exclude_patterns = []
 # The theme to use for HTML and HTML Help pages.  See the documentation for
 # a list of builtin themes.
 #
-html_theme = 'alabaster'
+html_theme = 'pyramid'
 
 # Add any paths that contain custom static files (such as style sheets) here,
 # relative to this directory. They are copied after the builtin static files,
diff --git a/docs/source/apt.utils.datasets.rst b/docs/source/apt.utils.datasets.rst
new file mode 100644
index 0000000..f40bbdf
--- /dev/null
+++ b/docs/source/apt.utils.datasets.rst
@@ -0,0 +1,22 @@
+apt.utils.datasets package
+==========================
+
+Submodules
+----------
+
+apt.utils.datasets.datasets module
+----------------------------------
+
+.. automodule:: apt.utils.datasets.datasets
+   :members:
+   :undoc-members:
+   :show-inheritance:
+
+
+Module contents
+---------------
+
+.. automodule:: apt.utils.datasets
+   :members:
+   :undoc-members:
+   :show-inheritance:
diff --git a/docs/source/apt.utils.models.rst b/docs/source/apt.utils.models.rst
new file mode 100644
index 0000000..de4a5b1
--- /dev/null
+++ b/docs/source/apt.utils.models.rst
@@ -0,0 +1,30 @@
+apt.utils.models package
+========================
+
+Submodules
+----------
+
+apt.utils.models.model module
+-----------------------------
+
+.. automodule:: apt.utils.models.model
+   :members:
+   :undoc-members:
+   :show-inheritance:
+
+apt.utils.models.sklearn\_model module
+--------------------------------------
+
+.. automodule:: apt.utils.models.sklearn_model
+   :members:
+   :undoc-members:
+   :show-inheritance:
+
+
+Module contents
+---------------
+
+.. automodule:: apt.utils.models
+   :members:
+   :undoc-members:
+   :show-inheritance:
diff --git a/docs/source/apt.utils.rst b/docs/source/apt.utils.rst
new file mode 100644
index 0000000..4a6ce11
--- /dev/null
+++ b/docs/source/apt.utils.rst
@@ -0,0 +1,31 @@
+apt.utils package
+=================
+
+Subpackages
+-----------
+
+.. toctree::
+   :maxdepth: 4
+
+   apt.utils.datasets
+   apt.utils.models
+
+Submodules
+----------
+
+apt.utils.dataset\_utils module
+-------------------------------
+
+.. automodule:: apt.utils.dataset_utils
+   :members:
+   :undoc-members:
+   :show-inheritance:
+
+
+Module contents
+---------------
+
+.. automodule:: apt.utils
+   :members:
+   :undoc-members:
+   :show-inheritance:
diff --git a/requirements.txt b/requirements.txt
index e1133d4..f841d7c 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -2,6 +2,7 @@ numpy==1.21.0
 pandas==1.1.0
 scipy==1.4.1
 scikit-learn==0.22.2
+torch>=1.8.0
 adversarial-robustness-toolbox>=1.10.1
 
 # testing

From fe676fa426c9a66e973d0e7a97348798ed661b86 Mon Sep 17 00:00:00 2001
From: abigailgold <57357634+abigailgold@users.noreply.github.com>
Date: Thu, 12 May 2022 15:44:29 +0300
Subject: [PATCH 09/26] New model wrappers (#32)

* keras wrapper + blackbox classifier wrapper (fix #7)

* fix error in NCP calculation

* Update notebooks

* Fix #25 (incorrect attack_feature indexes for social feature in notebook)

* Consistent naming of internal parameters
---
 apt/anonymization/anonymizer.py               |  16 +-
 apt/minimization/minimizer.py                 | 242 ++++----
 apt/utils/dataset_utils.py                    |  15 +-
 apt/utils/datasets/datasets.py                |  16 +-
 apt/utils/models/__init__.py                  |   3 +-
 apt/utils/models/keras_model.py               | 149 +++++
 apt/utils/models/model.py                     |  99 ++-
 apt/utils/models/sklearn_model.py             |  15 +-
 ...bute_inference_anonymization_nursery.ipynb | 575 +++++++++++++++---
 notebooks/minimization_adult.ipynb            |  78 +--
 notebooks/minimization_diabetes_reg.ipynb     | 173 +++---
 notebooks/minimization_german_credit.ipynb    | 217 +++----
 tests/test_anonymizer.py                      |  20 +-
 tests/test_minimizer.py                       | 391 +++++++-----
 tests/test_model.py                           |  54 +-
 15 files changed, 1407 insertions(+), 656 deletions(-)
 create mode 100644 apt/utils/models/keras_model.py

diff --git a/apt/anonymization/anonymizer.py b/apt/anonymization/anonymizer.py
index 909cae7..52b4055 100644
--- a/apt/anonymization/anonymizer.py
+++ b/apt/anonymization/anonymizer.py
@@ -101,11 +101,11 @@ class Anonymize:
             # build DT just on QI features
             x_anonymizer_train = x_prepared[:, self.quasi_identifiers]
         if self.is_regression:
-            self.anonymizer = DecisionTreeRegressor(random_state=10, min_samples_split=2, min_samples_leaf=self.k)
+            self._anonymizer = DecisionTreeRegressor(random_state=10, min_samples_split=2, min_samples_leaf=self.k)
         else:
-            self.anonymizer = DecisionTreeClassifier(random_state=10, min_samples_split=2, min_samples_leaf=self.k)
+            self._anonymizer = DecisionTreeClassifier(random_state=10, min_samples_split=2, min_samples_leaf=self.k)
 
-        self.anonymizer.fit(x_anonymizer_train, y)
+        self._anonymizer.fit(x_anonymizer_train, y)
         cells_by_id = self._calculate_cells(x, x_anonymizer_train)
         return self._anonymize_data(x, x_anonymizer_train, cells_by_id)
 
@@ -113,16 +113,16 @@ class Anonymize:
         # x is original data, x_anonymizer_train is only QIs + 1-hot encoded
         cells_by_id = {}
         leaves = []
-        for node, feature in enumerate(self.anonymizer.tree_.feature):
+        for node, feature in enumerate(self._anonymizer.tree_.feature):
             if feature == -2:  # leaf node
                 leaves.append(node)
-                hist = [int(i) for i in self.anonymizer.tree_.value[node][0]]
+                hist = [int(i) for i in self._anonymizer.tree_.value[node][0]]
                 # TODO we may change the method for choosing representative for cell
                 # label_hist = self.anonymizer.tree_.value[node][0]
                 # label = int(self.anonymizer.classes_[np.argmax(label_hist)])
                 cell = {'label': 1, 'hist': hist, 'id': int(node)}
                 cells_by_id[cell['id']] = cell
-        self.nodes = leaves
+        self._nodes = leaves
         self._find_representatives(x, x_anonymizer_train, cells_by_id.values())
         return cells_by_id
 
@@ -153,8 +153,8 @@ class Anonymize:
                     cell['representative'][feature] = min_value
 
     def _find_sample_nodes(self, samples):
-        paths = self.anonymizer.decision_path(samples).toarray()
-        node_set = set(self.nodes)
+        paths = self._anonymizer.decision_path(samples).toarray()
+        node_set = set(self._nodes)
         return [(list(set([i for i, v in enumerate(p) if v == 1]) & node_set))[0] for p in paths]
 
     def _find_sample_cells(self, samples, cells_by_id):
diff --git a/apt/minimization/minimizer.py b/apt/minimization/minimizer.py
index 7d538b0..df70a3a 100644
--- a/apt/minimization/minimizer.py
+++ b/apt/minimization/minimizer.py
@@ -12,7 +12,7 @@ from sklearn.compose import ColumnTransformer
 from sklearn.impute import SimpleImputer
 from sklearn.pipeline import Pipeline
 from sklearn.preprocessing import OneHotEncoder
-from sklearn.utils.validation import check_X_y, check_array, check_is_fitted
+from sklearn.utils.validation import check_is_fitted
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from sklearn.model_selection import train_test_split
 
@@ -68,7 +68,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             if is_regression:
                 self.estimator = SklearnRegressor(estimator)
             else:
-                self.estimator = SklearnClassifier(estimator, ModelOutputType.CLASSIFIER_VECTOR)
+                self.estimator = SklearnClassifier(estimator, ModelOutputType.CLASSIFIER_PROBABILITIES)
         self.target_accuracy = target_accuracy
         self.cells = cells
         self.categorical_features = []
@@ -124,7 +124,16 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                                  'categories' that contains sub-groups of categories for categorical features, and
                                  'untouched' that contains the features that could not be generalized.
         """
-        return self.generalizations_
+        return self._generalizations
+
+    @property
+    def ncp(self):
+        """
+        Return the NCP score of the generalizations.
+
+        :return: ncp score as float.
+        """
+        return self._ncp
 
     def fit_transform(self, X: Optional[DATA_PANDAS_NUMPY_TYPE] = None, y: Optional[DATA_PANDAS_NUMPY_TYPE] = None,
                       features_names: Optional[list] = None, dataset: Optional[ArrayDataset] = None):
@@ -172,27 +181,20 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 dataset = ArrayDataset(X, y, features_names)
 
         if dataset and dataset.get_samples() is not None and dataset.get_labels() is not None:
-            self.n_features_ = dataset.get_samples().shape[1]
-
+            self._n_features = dataset.get_samples().shape[1]
         elif dataset and dataset.features_names:
-            self.n_features_ = len(dataset.features_names)
+            self._n_features = len(dataset.features_names)
         else:
-            self.n_features_ = 0
+            self._n_features = 0
 
         if dataset and dataset.features_names:
             self._features = dataset.features_names
         # if features is None, use numbers instead of names
-        elif self.n_features_ != 0:
-            self._features = [str(i) for i in range(self.n_features_)]
+        elif self._n_features != 0:
+            self._features = [str(i) for i in range(self._n_features)]
         else:
             self._features = None
 
-        if self.cells:
-            self.cells_ = self.cells
-        else:
-            self.cells_ = {}
-        self.categorical_values = {}
-
         # Going to fit
         # (currently not dealing with option to fit with only X and y and no estimator)
         if self.estimator and dataset and dataset.get_samples() is not None and dataset.get_labels() is not None:
@@ -231,28 +233,10 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                         fd['max'] = max(values)
                         fd['range'] = max(values) - min(values)
                     else:
-                        fd['range'] = len(values)
+                        fd['range'] = len(np.unique(values))
                     feature_data[feature] = fd
 
             # prepare data for DT
-            categorical_features = [f for f in self._features if f in self.categorical_features and
-                                    f in self.features_to_minimize]
-
-            numeric_transformer = Pipeline(
-                steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
-            )
-
-            numeric_features = [f for f in self._features if f not in self.categorical_features and
-                                f in self.features_to_minimize]
-            categorical_transformer = OneHotEncoder(handle_unknown="ignore", sparse=False)
-
-            preprocessor_QI_features = ColumnTransformer(
-                transformers=[
-                    ("num", numeric_transformer, numeric_features),
-                    ("cat", categorical_transformer, categorical_features),
-                ]
-            )
-            preprocessor_QI_features.fit(x_QI)
 
             # preprocessor to fit data that have features not included in QI (to get accuracy)
             numeric_features = [f for f in self._features if f not in self.categorical_features]
@@ -267,44 +251,68 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 ]
             )
             preprocessor.fit(x)
-            x_prepared = preprocessor.transform(X_train)
+
             if self.train_only_QI:
+                categorical_features = [f for f in self._features if f in self.categorical_features and
+                                        f in self.features_to_minimize]
+
+                numeric_transformer = Pipeline(
+                        steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
+                )
+
+                numeric_features = [f for f in self._features if f not in self.categorical_features and
+                                    f in self.features_to_minimize]
+                categorical_transformer = OneHotEncoder(handle_unknown="ignore", sparse=False)
+
+                preprocessor_QI_features = ColumnTransformer(
+                        transformers=[
+                            ("num", numeric_transformer, numeric_features),
+                            ("cat", categorical_transformer, categorical_features),
+                        ]
+                )
+                preprocessor_QI_features.fit(x_QI)
                 x_prepared = preprocessor_QI_features.transform(X_train_QI)
+            else:
+                x_prepared = preprocessor.transform(X_train)
 
             self._preprocessor = preprocessor
 
-            self.cells_ = {}
+            self.cells = []
+            self._categorical_values = {}
+
             if self.is_regression:
-                self.dt_ = DecisionTreeRegressor(random_state=10, min_samples_split=2, min_samples_leaf=1)
+                self._dt = DecisionTreeRegressor(random_state=10, min_samples_split=2, min_samples_leaf=1)
             else:
-                self.dt_ = DecisionTreeClassifier(random_state=0, min_samples_split=2,
+                self._dt = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                                   min_samples_leaf=1)
-            self.dt_.fit(x_prepared, y_train)
+            self._dt.fit(x_prepared, y_train)
+
             self._modify_categorical_features(used_data)
 
-            x_prepared = pd.DataFrame(x_prepared, columns=self.categorical_data.columns)
+            x_prepared = pd.DataFrame(x_prepared, columns=self._categorical_data.columns)
 
             self._calculate_cells()
             self._modify_cells()
             # features that are not from QI should not be part of generalizations
             for feature in self._features:
                 if feature not in self.features_to_minimize:
-                    self._remove_feature_from_cells(self.cells_, self.cells_by_id_, feature)
+                    self._remove_feature_from_cells(self.cells, self._cells_by_id, feature)
 
             nodes = self._get_nodes_level(0)
             self._attach_cells_representatives(x_prepared, used_X_train, y_train, nodes)
 
-            # self.cells_ currently holds the generalization created from the tree leaves
+            # self.cells currently holds the generalization created from the tree leaves
             self._calculate_generalizations()
 
             # apply generalizations to test data
-            x_prepared_test = preprocessor.transform(X_test)
             if self.train_only_QI:
                 x_prepared_test = preprocessor_QI_features.transform(X_test_QI)
+            else:
+                x_prepared_test = preprocessor.transform(X_test)
 
-            x_prepared_test = pd.DataFrame(x_prepared_test, index=X_test.index, columns=self.categorical_data.columns)
+            x_prepared_test = pd.DataFrame(x_prepared_test, index=X_test.index, columns=self._categorical_data.columns)
 
-            generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells_, self.cells_by_id_)
+            generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells, self._cells_by_id)
 
             # check accuracy
             accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
@@ -317,22 +325,22 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 level = 1
                 while accuracy > self.target_accuracy:
                     try:
-                        cells_previous_iter = self.cells_
-                        generalization_prev_iter = self.generalizations_
-                        cells_by_id_prev = self.cells_by_id_
+                        cells_previous_iter = self.cells
+                        generalization_prev_iter = self._generalizations
+                        cells_by_id_prev = self._cells_by_id
                         nodes = self._get_nodes_level(level)
                         self._calculate_level_cells(level)
                         self._attach_cells_representatives(x_prepared, used_X_train, y_train, nodes)
 
                         self._calculate_generalizations()
-                        generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells_,
-                                                       self.cells_by_id_)
+                        generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells,
+                                                       self._cells_by_id)
                         accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
                         # if accuracy passed threshold roll back to previous iteration generalizations
                         if accuracy < self.target_accuracy:
-                            self.cells_ = cells_previous_iter
-                            self.generalizations_ = generalization_prev_iter
-                            self.cells_by_id_ = cells_by_id_prev
+                            self.cells = cells_previous_iter
+                            self._generalizations = generalization_prev_iter
+                            self._cells_by_id = cells_by_id_prev
                             break
                         else:
                             print('Pruned tree to level: %d, new relative accuracy: %f' % (level, accuracy))
@@ -352,14 +360,14 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                         break
 
                     self._calculate_generalizations()
-                    generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells_, self.cells_by_id_)
+                    generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells, self._cells_by_id)
                     accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
                     print('Removed feature: %s, new relative accuracy: %f' % (removed_feature, accuracy))
 
-            # self.cells_ currently holds the chosen generalization based on target accuracy
+            # self.cells currently holds the chosen generalization based on target accuracy
 
             # calculate iLoss
-            self.ncp_ = self._calculate_ncp(X_test, self.generalizations_, feature_data)
+            self._ncp = self._calculate_ncp(X_test, self._generalizations, feature_data)
 
         # Return the transformer
         return self
@@ -398,7 +406,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         if dataset and dataset.get_samples() is not None:
             x = pd.DataFrame(dataset.get_samples(), columns=self._features)
 
-        if x.shape[1] != self.n_features_ and self.n_features_ != 0:
+        if x.shape[1] != self._n_features and self._n_features != 0:
             raise ValueError('Shape of input is different from what was seen'
                              'in `fit`')
 
@@ -410,23 +418,23 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         mapped = np.zeros(x.shape[0])  # to mark records we already mapped
 
         # iterate over cells (leaves in decision tree)
-        for i in range(len(self.cells_)):
+        for i in range(len(self.cells)):
             # Copy the representatives from the cells into another data structure:
             # iterate over features in test data
             for feature in self._features:
                 # if feature has a representative value in the cell and should not
                 # be left untouched, take the representative value
-                if feature in self.cells_[i]['representative'] and \
-                        ('untouched' not in self.cells_[i]
-                         or feature not in self.cells_[i]['untouched']):
-                    representatives.loc[i, feature] = self.cells_[i]['representative'][feature]
+                if feature in self.cells[i]['representative'] and \
+                        ('untouched' not in self.cells[i]
+                         or feature not in self.cells[i]['untouched']):
+                    representatives.loc[i, feature] = self.cells[i]['representative'][feature]
                 # else, drop the feature (removes from representatives columns that
                 # do not have a representative value or should remain untouched)
                 elif feature in representatives.columns.tolist():
                     representatives = representatives.drop(feature, axis=1)
 
             # get the indexes of all records that map to this cell
-            indexes = self._get_record_indexes_for_cell(x, self.cells_[i], mapped)
+            indexes = self._get_record_indexes_for_cell(x, self.cells[i], mapped)
 
             # replace the values in the representative columns with the representative
             # values (leaves others untouched)
@@ -467,8 +475,8 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         return True
 
     def _modify_categorical_features(self, X):
-        self.categorical_values = {}
-        self.oneHotVectorFeaturesToFeatures = {}
+        self._categorical_values = {}
+        self._one_hot_vector_features_to_features = {}
         features_to_remove = []
         used_features = self._features
         if self.train_only_QI:
@@ -478,17 +486,17 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 try:
                     all_values = X.loc[:, feature]
                     values = list(all_values.unique())
-                    self.categorical_values[feature] = values
+                    self._categorical_values[feature] = values
                     X[feature] = pd.Categorical(X.loc[:, feature], categories=values, ordered=False)
                     ohe = pd.get_dummies(X[feature], prefix=feature)
-                    for oneHotVectorFeature in ohe.columns:
-                        self.oneHotVectorFeaturesToFeatures[oneHotVectorFeature] = feature
+                    for one_hot_vector_feature in ohe.columns:
+                        self._one_hot_vector_features_to_features[one_hot_vector_feature] = feature
                     X = pd.concat([X, ohe], axis=1)
                     features_to_remove.append(feature)
                 except KeyError:
                     print("feature " + feature + "not found in training data")
 
-        self.categorical_data = X.drop(features_to_remove, axis=1)
+        self._categorical_data = X.drop(features_to_remove, axis=1)
 
     def _cell_contains_numeric(self, f, range, x):
         i = self._features.index(f)
@@ -513,24 +521,24 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         return False
 
     def _calculate_cells(self):
-        self.cells_by_id_ = {}
-        self.cells_ = self._calculate_cells_recursive(0)
+        self._cells_by_id = {}
+        self.cells = self._calculate_cells_recursive(0)
 
     def _calculate_cells_recursive(self, node):
-        feature_index = self.dt_.tree_.feature[node]
+        feature_index = self._dt.tree_.feature[node]
         if feature_index == -2:
             # this is a leaf
             # if it is a regression problem we do not use label
             label = self._calculate_cell_label(node) if not self.is_regression else 1
-            hist = [int(i) for i in self.dt_.tree_.value[node][0]] if not self.is_regression else []
+            hist = [int(i) for i in self._dt.tree_.value[node][0]] if not self.is_regression else []
             cell = {'label': label, 'hist': hist, 'ranges': {}, 'id': int(node)}
             return [cell]
 
         cells = []
-        feature = self.categorical_data.columns[feature_index]
-        threshold = self.dt_.tree_.threshold[node]
-        left_child = self.dt_.tree_.children_left[node]
-        right_child = self.dt_.tree_.children_right[node]
+        feature = self._categorical_data.columns[feature_index]
+        threshold = self._dt.tree_.threshold[node]
+        left_child = self._dt.tree_.children_left[node]
+        right_child = self._dt.tree_.children_right[node]
 
         left_child_cells = self._calculate_cells_recursive(left_child)
         for cell in left_child_cells:
@@ -539,7 +547,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             if cell['ranges'][feature]['end'] is None:
                 cell['ranges'][feature]['end'] = threshold
             cells.append(cell)
-            self.cells_by_id_[cell['id']] = cell
+            self._cells_by_id[cell['id']] = cell
 
         right_child_cells = self._calculate_cells_recursive(right_child)
         for cell in right_child_cells:
@@ -548,26 +556,26 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             if cell['ranges'][feature]['start'] is None:
                 cell['ranges'][feature]['start'] = threshold
             cells.append(cell)
-            self.cells_by_id_[cell['id']] = cell
+            self._cells_by_id[cell['id']] = cell
 
         return cells
 
     def _calculate_cell_label(self, node):
-        label_hist = self.dt_.tree_.value[node][0]
-        return int(self.dt_.classes_[np.argmax(label_hist)])
+        label_hist = self._dt.tree_.value[node][0]
+        return int(self._dt.classes_[np.argmax(label_hist)])
 
     def _modify_cells(self):
         cells = []
-        features = self.categorical_data.columns
-        for cell in self.cells_:
+        features = self._categorical_data.columns
+        for cell in self.cells:
             new_cell = {'id': cell['id'], 'label': cell['label'], 'ranges': {}, 'categories': {}, 'hist': cell['hist'],
                         'representative': None}
             for feature in features:
-                if feature in self.oneHotVectorFeaturesToFeatures.keys():
+                if feature in self._one_hot_vector_features_to_features.keys():
                     # feature is categorical and should be mapped
-                    categorical_feature = self.oneHotVectorFeaturesToFeatures[feature]
+                    categorical_feature = self._one_hot_vector_features_to_features[feature]
                     if categorical_feature not in new_cell['categories'].keys():
-                        new_cell['categories'][categorical_feature] = self.categorical_values[
+                        new_cell['categories'][categorical_feature] = self._categorical_values[
                             categorical_feature].copy()
                     if feature in cell['ranges'].keys():
                         categorical_value = feature[len(categorical_feature) + 1:]
@@ -584,11 +592,11 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     else:
                         new_cell['ranges'][feature] = {'start': None, 'end': None}
             cells.append(new_cell)
-            self.cells_by_id_[new_cell['id']] = new_cell
-        self.cells_ = cells
+            self._cells_by_id[new_cell['id']] = new_cell
+        self.cells = cells
 
     def _calculate_level_cells(self, level):
-        if level < 0 or level > self.dt_.get_depth():
+        if level < 0 or level > self._dt.get_depth():
             raise TypeError("Illegal level %d' % level", level)
 
         if level > 0:
@@ -597,13 +605,13 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             nodes = self._get_nodes_level(level)
             if nodes:
                 for node in nodes:
-                    if self.dt_.tree_.feature[node] == -2:  # leaf node
-                        new_cell = self.cells_by_id_[node]
+                    if self._dt.tree_.feature[node] == -2:  # leaf node
+                        new_cell = self._cells_by_id[node]
                     else:
-                        left_child = self.dt_.tree_.children_left[node]
-                        right_child = self.dt_.tree_.children_right[node]
-                        left_cell = self.cells_by_id_[left_child]
-                        right_cell = self.cells_by_id_[right_child]
+                        left_child = self._dt.tree_.children_left[node]
+                        right_child = self._dt.tree_.children_right[node]
+                        left_cell = self._cells_by_id[left_child]
+                        right_cell = self._cells_by_id[right_child]
                         new_cell = {'id': int(node), 'ranges': {}, 'categories': {}, 'untouched': [],
                                     'label': None, 'representative': None}
                         for feature in left_cell['ranges'].keys():
@@ -620,28 +628,28 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                         self._calculate_level_cell_label(left_cell, right_cell, new_cell)
                     new_cells.append(new_cell)
                     new_cells_by_id[new_cell['id']] = new_cell
-                self.cells_ = new_cells
-                self.cells_by_id_ = new_cells_by_id
+                self.cells = new_cells
+                self._cells_by_id = new_cells_by_id
             # else: nothing to do, stay with previous cells
 
     def _calculate_level_cell_label(self, left_cell, right_cell, new_cell):
         new_cell['hist'] = [x + y for x, y in
                             zip(left_cell['hist'], right_cell['hist'])] if not self.is_regression else []
-        new_cell['label'] = int(self.dt_.classes_[np.argmax(new_cell['hist'])]) if not self.is_regression else 1
+        new_cell['label'] = int(self._dt.classes_[np.argmax(new_cell['hist'])]) if not self.is_regression else 1
 
     def _get_nodes_level(self, level):
         # level = distance from lowest leaf
-        node_depth = np.zeros(shape=self.dt_.tree_.node_count, dtype=np.int64)
-        is_leaves = np.zeros(shape=self.dt_.tree_.node_count, dtype=bool)
+        node_depth = np.zeros(shape=self._dt.tree_.node_count, dtype=np.int64)
+        is_leaves = np.zeros(shape=self._dt.tree_.node_count, dtype=bool)
         stack = [(0, -1)]  # seed is the root node id and its parent depth
         while len(stack) > 0:
             node_id, parent_depth = stack.pop()
             # depth = distance from root
             node_depth[node_id] = parent_depth + 1
 
-            if self.dt_.tree_.children_left[node_id] != self.dt_.tree_.children_right[node_id]:
-                stack.append((self.dt_.tree_.children_left[node_id], parent_depth + 1))
-                stack.append((self.dt_.tree_.children_right[node_id], parent_depth + 1))
+            if self._dt.tree_.children_left[node_id] != self._dt.tree_.children_right[node_id]:
+                stack.append((self._dt.tree_.children_left[node_id], parent_depth + 1))
+                stack.append((self._dt.tree_.children_right[node_id], parent_depth + 1))
             else:
                 is_leaves[node_id] = True
 
@@ -660,7 +668,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         # if there is no categorical data prepared data is original data
         nodeIds = self._find_sample_nodes(prepared_data, level_nodes)
         labels_df = pd.DataFrame(labelFeature, columns=['label'])
-        for cell in self.cells_:
+        for cell in self.cells:
             cell['representative'] = {}
             # get all rows in cell
             indexes = [i for i, x in enumerate(nodeIds) if x == cell['id']]
@@ -695,14 +703,14 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 cell['representative'][feature] = row[feature]
 
     def _find_sample_nodes(self, samples, nodes):
-        paths = self.dt_.decision_path(samples).toarray()
+        paths = self._dt.decision_path(samples).toarray()
         nodeSet = set(nodes)
         return [(list(set([i for i, v in enumerate(p) if v == 1]) & nodeSet))[0] for p in paths]
 
     def _generalize(self, original_data, prepared_data, level_nodes, cells, cells_by_id):
         # prepared data include one hot encoded categorical data + QI
         representatives = pd.DataFrame(columns=self._features)  # empty except for columns
-        generalized = pd.DataFrame(prepared_data, columns=self.categorical_data.columns, copy=True)
+        generalized = pd.DataFrame(prepared_data, columns=self._categorical_data.columns, copy=True)
         original_data_generalized = pd.DataFrame(original_data, columns=self._features, copy=True)
         mapping_to_cells = self._map_to_cells(generalized, level_nodes, cells_by_id)
         # iterate over cells (leaves in decision tree)
@@ -755,7 +763,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                                               current_accuracy)
         if feature is None:
             return None
-        GeneralizeToRepresentative._remove_feature_from_cells(self.cells_, self.cells_by_id_, feature)
+        GeneralizeToRepresentative._remove_feature_from_cells(self.cells, self._cells_by_id, feature)
         return feature
 
     def _get_feature_to_remove(self, original_data, prepared_data, nodes, labels, feature_data, current_accuracy):
@@ -763,7 +771,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         # if there is no categorical data prepared data is original data
         # We want to remove features with low iLoss (NCP) and high accuracy gain
         # (after removing them)
-        ranges = self.generalizations_['ranges']
+        ranges = self._generalizations['ranges']
         range_counts = self._find_range_count(original_data, ranges)
         total = prepared_data.size
         range_min = sys.float_info.max
@@ -772,15 +780,15 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         category_counts = self._find_categories_count(original_data, categories)
 
         for feature in ranges.keys():
-            if feature not in self.generalizations_['untouched']:
+            if feature not in self._generalizations['untouched']:
                 feature_ncp = self._calc_ncp_numeric(ranges[feature],
                                                      range_counts[feature],
                                                      feature_data[feature],
                                                      total)
                 if feature_ncp > 0:
                     # divide by accuracy gain
-                    new_cells = copy.deepcopy(self.cells_)
-                    cells_by_id = copy.deepcopy(self.cells_by_id_)
+                    new_cells = copy.deepcopy(self.cells)
+                    cells_by_id = copy.deepcopy(self._cells_by_id)
                     GeneralizeToRepresentative._remove_feature_from_cells(new_cells, cells_by_id, feature)
                     generalized = self._generalize(original_data, prepared_data, nodes, new_cells, cells_by_id)
                     accuracy_gain = self.estimator.score(ArrayDataset(self._preprocessor.transform(generalized),
@@ -802,8 +810,8 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                                                          total)
                 if feature_ncp > 0:
                     # divide by accuracy loss
-                    new_cells = copy.deepcopy(self.cells_)
-                    cells_by_id = copy.deepcopy(self.cells_by_id_)
+                    new_cells = copy.deepcopy(self.cells)
+                    cells_by_id = copy.deepcopy(self._cells_by_id)
                     GeneralizeToRepresentative._remove_feature_from_cells(new_cells, cells_by_id, feature)
                     generalized = self._generalize(original_data, prepared_data, nodes, new_cells, cells_by_id)
                     accuracy_gain = self.estimator.score(ArrayDataset(self._preprocessor.transform(generalized),
@@ -821,12 +829,12 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         return remove_feature
 
     def _calculate_generalizations(self):
-        self.generalizations_ = {'ranges': GeneralizeToRepresentative._calculate_ranges(self.cells_),
-                                 'categories': GeneralizeToRepresentative._calculate_categories(self.cells_),
-                                 'untouched': GeneralizeToRepresentative._calculate_untouched(self.cells_)}
+        self._generalizations = {'ranges': GeneralizeToRepresentative._calculate_ranges(self.cells),
+                                 'categories': GeneralizeToRepresentative._calculate_categories(self.cells),
+                                 'untouched': GeneralizeToRepresentative._calculate_untouched(self.cells)}
 
     def _find_range_count(self, samples, ranges):
-        samples_df = pd.DataFrame(samples, columns=self.categorical_data.columns)
+        samples_df = pd.DataFrame(samples, columns=self._categorical_data.columns)
         range_counts = {}
         last_value = None
         for r in ranges.keys():
diff --git a/apt/utils/dataset_utils.py b/apt/utils/dataset_utils.py
index e395717..2b119b5 100644
--- a/apt/utils/dataset_utils.py
+++ b/apt/utils/dataset_utils.py
@@ -6,7 +6,7 @@ from os import path, mkdir
 from six.moves.urllib.request import urlretrieve
 
 
-def get_iris_dataset(test_set: float = 0.3):
+def get_iris_dataset_np(test_set: float = 0.3):
     """
     Loads the Iris dataset from scikit-learn.
 
@@ -29,7 +29,7 @@ def _load_iris(test_set_size: float = 0.3):
     return (x_train, y_train), (x_test, y_test)
 
 
-def get_diabetes_dataset(test_set: float = 0.3):
+def get_diabetes_dataset_np(test_set: float = 0.3):
     """
     Loads the Diabetes dataset from scikit-learn.
 
@@ -52,7 +52,7 @@ def _load_diabetes(test_set_size: float = 0.3):
     return (x_train, y_train), (x_test, y_test)
 
 
-def get_german_credit_dataset(test_set: float = 0.3):
+def get_german_credit_dataset_pd(test_set: float = 0.3):
     """
     Loads the UCI German credit dataset from `tests/datasets/german` or downloads it from
     https://archive.ics.uci.edu/ml/machine-learning-databases/statlog/german/ if necessary.
@@ -122,11 +122,16 @@ def _modify_german_dataset(data):
             return 1
         else:
             raise Exception('Bad value')
+
+    def modify_label(value):
+        return value - 1
+
     data['Foreign_worker'] = data['Foreign_worker'].apply(modify_Foreign_worker)
     data['Telephone'] = data['Telephone'].apply(modify_Telephone)
+    data['label'] = data['label'].apply(modify_label)
 
 
-def get_adult_dataset():
+def get_adult_dataset_pd():
     """
     Loads the UCI Adult dataset from `tests/datasets/adult` or downloads it from
     https://archive.ics.uci.edu/ml/machine-learning-databases/adult/ if necessary.
@@ -228,7 +233,7 @@ def _modify_adult_dataset(data):
     return data.drop(['fnlwgt', 'education'], axis=1)
 
 
-def get_nursery_dataset(raw: bool = True, test_set: float = 0.2, transform_social: bool = False):
+def get_nursery_dataset_pd(raw: bool = True, test_set: float = 0.2, transform_social: bool = False):
     """
     Loads the UCI Nursery dataset from `tests/datasets/nursery` or downloads it from
     https://archive.ics.uci.edu/ml/machine-learning-databases/nursery/ if necessary.
diff --git a/apt/utils/datasets/datasets.py b/apt/utils/datasets/datasets.py
index 9383a2f..02d886e 100644
--- a/apt/utils/datasets/datasets.py
+++ b/apt/utils/datasets/datasets.py
@@ -5,7 +5,7 @@ Implementation of utility classes for dataset handling
 """
 
 from abc import ABCMeta, abstractmethod
-from typing import Callable, Collection, Any, Union, List, Optional
+from typing import Callable, Collection, Any, Union, List, Optional, Type
 
 import tarfile
 import os
@@ -19,9 +19,9 @@ from torch import Tensor
 logger = logging.getLogger(__name__)
 
 
-INPUT_DATA_ARRAY_TYPE = Union[np.ndarray, pd.DataFrame, List, Tensor]
+INPUT_DATA_ARRAY_TYPE = Union[np.ndarray, pd.DataFrame, pd.Series, List, Tensor]
 OUTPUT_DATA_ARRAY_TYPE = np.ndarray
-DATA_PANDAS_NUMPY_TYPE = Union[np.ndarray, pd.DataFrame]
+DATA_PANDAS_NUMPY_TYPE = Union[np.ndarray, pd.DataFrame, pd.Series]
 
 
 class Dataset(metaclass=ABCMeta):
@@ -323,7 +323,7 @@ class DatasetFactory:
         :return: a Callable that returns the registered dataset class
         """
 
-        def inner_wrapper(wrapped_class: Dataset) -> Any:
+        def inner_wrapper(wrapped_class: Type[Dataset]) -> Any:
             if name in cls.registry:
                 logger.warning('Dataset %s already exists. Will replace it', name)
             cls.registry[name] = wrapped_class
@@ -414,14 +414,18 @@ class Data:
         """
         Get test set samples
 
-        :return: test samples
+        :return: test samples, or None if no test data provided
         """
+        if self.test is None:
+            return None
         return self.test.get_samples()
 
     def get_test_labels(self) -> Collection[Any]:
         """
         Get test set labels
 
-        :return: test labels
+        :return: test labels, or None if no test data provided
         """
+        if self.test is None:
+            return None
         return self.test.get_labels()
diff --git a/apt/utils/models/__init__.py b/apt/utils/models/__init__.py
index 11efd5f..f6a89fc 100644
--- a/apt/utils/models/__init__.py
+++ b/apt/utils/models/__init__.py
@@ -1,2 +1,3 @@
-from apt.utils.models.model import Model, ModelOutputType
+from apt.utils.models.model import Model, BlackboxClassifier, ModelOutputType, ScoringMethod
 from apt.utils.models.sklearn_model import SklearnModel, SklearnClassifier, SklearnRegressor
+from apt.utils.models.keras_model import KerasClassifier
diff --git a/apt/utils/models/keras_model.py b/apt/utils/models/keras_model.py
new file mode 100644
index 0000000..12d8ba3
--- /dev/null
+++ b/apt/utils/models/keras_model.py
@@ -0,0 +1,149 @@
+from typing import Optional
+
+import numpy as np
+from sklearn.preprocessing import OneHotEncoder
+
+import tensorflow as tf
+from tensorflow import keras
+tf.compat.v1.disable_eager_execution()
+
+from apt.utils.models import Model, ModelOutputType, ScoringMethod
+from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
+
+from art.utils import check_and_transform_label_format
+from art.estimators.classification.keras import KerasClassifier as ArtKerasClassifier
+# from art.estimators.regression.keras import KerasRegressor as ArtKerasRegressor
+
+
+class KerasModel(Model):
+    """
+    Wrapper class for keras models.
+    """
+
+
+
+class KerasClassifier(KerasModel):
+    """
+    Wrapper class for keras classification models.
+
+    :param model: The original keras model object.
+    :type model: `keras.models.Model`
+    :param output_type: The type of output the model yields (vector/label only)
+    :type output_type: `ModelOutputType`
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Set to True if the model is only available via query (API) access, i.e.,
+                             only the outputs of the model are exposed, and False if the model internals
+                             are also available. Default is True.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                              unlimited queries to the model API or whether there is a limit to the number of
+                              queries that can be submitted. Default is True.
+    :type unlimited_queries: boolean, optional
+    """
+    def __init__(self, model: keras.models.Model, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
+                 unlimited_queries: Optional[bool] = True, **kwargs):
+        super().__init__(model, output_type, black_box_access, unlimited_queries, **kwargs)
+        logits = False
+        if output_type == ModelOutputType.CLASSIFIER_LOGITS:
+            logits = True
+        self._art_model = ArtKerasClassifier(model, use_logits=logits)
+
+    def fit(self, train_data: Dataset, **kwargs) -> None:
+        """
+        Fit the model using the training data.
+
+        :param train_data: Training data. Labels are expected to either be one-hot encoded or a 1D-array of categorical
+                           labels (consecutive integers starting at 0).
+        :type train_data: `Dataset`
+        :return: None
+        """
+        y_encoded = check_and_transform_label_format(train_data.get_labels())
+        self._art_model.fit(train_data.get_samples(), y_encoded, **kwargs)
+
+    def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Perform predictions using the model for input `x`.
+
+        :param x: Input samples.
+        :type x: `Dataset`
+        :return: Predictions from the model as numpy array (class probabilities, if supported).
+        """
+        return self._art_model.predict(x.get_samples(), **kwargs)
+
+    def score(self, test_data: Dataset, scoring_method: Optional[ScoringMethod] = ScoringMethod.ACCURACY, **kwargs):
+        """
+        Score the model using test data.
+
+        :param test_data: Test data.
+        :type test_data: `Dataset`
+        :param scoring_method: The method for scoring predictions. Default is ACCURACY.
+        :type scoring_method: `ScoringMethod`, optional
+        :return: the score as float (between 0 and 1)
+        """
+        y = check_and_transform_label_format(test_data.get_labels(), self._art_model.nb_classes)
+        predicted = self.predict(test_data)
+        if scoring_method == ScoringMethod.ACCURACY:
+            return np.count_nonzero(np.argmax(y, axis=1) == np.argmax(predicted, axis=1)) / predicted.shape[0]
+        else:
+            raise NotImplementedError
+
+
+# class KerasRegressor(KerasModel):
+#     """
+#     Wrapper class for keras regression models.
+#
+#     :param model: The original keras model object.
+#     :type model: `keras.models.Model`
+#     :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+#                              Set to True if the model is only available via query (API) access, i.e.,
+#                              only the outputs of the model are exposed, and False if the model internals
+#                              are also available. Default is True.
+#     :type black_box_access: boolean, optional
+#     :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+#                               unlimited queries to the model API or whether there is a limit to the number of
+#                               queries that can be submitted. Default is True.
+#     :type unlimited_queries: boolean, optional
+#     """
+#     def __init__(self, model: keras.models.Model, black_box_access: Optional[bool] = True,
+#                  unlimited_queries: Optional[bool] = True, **kwargs):
+#         super().__init__(model, ModelOutputType.REGRESSOR_SCALAR, black_box_access, unlimited_queries, **kwargs)
+#         self._art_model = ArtKerasRegressor(model)
+#
+#     def fit(self, train_data: Dataset, **kwargs) -> None:
+#         """
+#         Fit the model using the training data.
+#
+#         :param train_data: Training data.
+#         :type train_data: `Dataset`
+#         :return: None
+#         """
+#         self._art_model.fit(train_data.get_samples(), train_data.get_labels(), **kwargs)
+#
+#     def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
+#         """
+#         Perform predictions using the model for input `x`.
+#
+#         :param x: Input samples.
+#         :type x: `Dataset`
+#         :return: Predictions from the model as numpy array.
+#         """
+#         return self._art_model.predict(x.get_samples(), **kwargs)
+#
+#     def score(self, test_data: Dataset, scoring_method: Optional[ScoringMethod] = ScoringMethod.MEAN_SQUARED_ERROR,
+#               **kwargs):
+#         """
+#         Score the model using test data.
+#
+#         :param test_data: Test data.
+#         :type test_data: `Dataset`
+#         :param scoring_method: The method for scoring predictions. Default is MEAN_SQUARED_ERROR.
+#         :type scoring_method: `ScoringMethod`, optional
+#         :return: the score as float
+#         """
+#         y = check_and_transform_label_format(test_data.get_labels(), self._art_model.nb_classes)
+#         predicted = self.predict(test_data)
+#         if scoring_method == ScoringMethod.MEAN_SQUARED_ERROR:
+#             mse = keras.losses.MeanSquaredError(reduction=keras.losses.Reduction.SUM)
+#             return mse(y, predicted).numpy()
+#         else:
+#             raise NotImplementedError('Only MEAN_SQUARED_ERROR supported as scoring method')
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index c362fb5..7af3a01 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -1,16 +1,25 @@
 from abc import ABCMeta, abstractmethod
 from typing import Any, Optional
 from enum import Enum, auto
+import numpy as np
 
-from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
+from apt.utils.datasets import Dataset, Data, OUTPUT_DATA_ARRAY_TYPE
+from art.estimators.classification import BlackBoxClassifier
+from art.utils import check_and_transform_label_format
 
 
 class ModelOutputType(Enum):
-    CLASSIFIER_VECTOR = auto()  # probabilities or logits
+    CLASSIFIER_PROBABILITIES = auto()  # vector of probabilities
+    CLASSIFIER_LOGITS = auto()  # vector of logits
     CLASSIFIER_SCALAR = auto()  # label only
     REGRESSOR_SCALAR = auto()  # value
 
 
+class ScoringMethod(Enum):
+    ACCURACY = auto()  # number of correct predictions divided by the number of samples
+    MEAN_SQUARED_ERROR = auto()  # mean squared error between the predictions and true labels
+
+
 class Model(metaclass=ABCMeta):
     """
     Abstract base class for ML model wrappers.
@@ -54,7 +63,7 @@ class Model(metaclass=ABCMeta):
         Perform predictions using the model for input `x`.
 
         :param x: Input samples.
-        :type x: `np.ndarray` or `pandas.DataFrame`
+        :type x: `Dataset`
         :return: Predictions from the model as numpy array.
         """
         raise NotImplementedError
@@ -107,3 +116,87 @@ class Model(metaclass=ABCMeta):
         :return: True if a user can perform unlimited queries to the model API, otherwise False.
         """
         return self._unlimited_queries
+
+    def get_nb_classes(self, y: OUTPUT_DATA_ARRAY_TYPE) -> int:
+        """
+        Get the number of classes from an array of labels
+
+        :param y: the labels
+        :type y: numpy array
+        :return: the number of classes as integer
+        """
+        if len(y.shape) == 1:
+            return len(np.unique(y))
+        else:
+            return y.shape[1]
+
+
+class BlackboxClassifier(Model):
+    """
+    Wrapper for black-box ML classification models.
+
+    :param model: The training and/or test data along with the model's predictions for the data. Assumes that the data
+                  is represented as numpy arrays. Labels are expected to either be one-hot encoded or
+                  a 1D-array of categorical labels (consecutive integers starting at 0).
+    :type model: `Data` object
+    :param output_type: The type of output the model yields (vector/label only for classifiers,
+                        value for regressors)
+    :type output_type: `ModelOutputType`
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Always assumed to be True for this wrapper.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: Boolean indicating whether a user can perform unlimited queries to the model API.
+                              Always assumed to be False for this wrapper.
+    :type unlimited_queries: boolean, optional
+    """
+
+    def __init__(self, model: Data, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
+                 unlimited_queries: Optional[bool] = True, **kwargs):
+        super().__init__(model, output_type, black_box_access=True, unlimited_queries=False, **kwargs)
+        x = model.get_train_samples()
+        y = model.get_train_labels()
+        self.nb_classes = self.get_nb_classes(y)
+        y = check_and_transform_label_format(y, nb_classes=self.nb_classes)
+
+        if model.get_test_samples() is not None and type(x) == np.ndarray:
+            x = np.vstack((x, model.get_test_samples()))
+
+        if model.get_test_labels() is not None and type(y) == np.ndarray:
+            y = np.vstack((y, check_and_transform_label_format(model.get_test_labels(), nb_classes=self.nb_classes)))
+
+        predict_fn = (x, y)
+        self._art_model = BlackBoxClassifier(predict_fn, x.shape[1:], self.nb_classes, fuzzy_float_compare=True)
+
+    def fit(self, train_data: Dataset, **kwargs) -> None:
+        """
+        A blackbox model cannot be fit.
+        """
+        raise NotImplementedError
+
+    def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Get predictions from the model for input `x`. `x` must be a subset of the samples that were supplied
+        through the `model` argument (a `Data` object) of `__init__()`.
+
+        :param x: Input samples.
+        :type x: `Dataset`
+        :return: Predictions from the model as numpy array.
+        """
+        return self._art_model.predict(x.get_samples())
+
+    def score(self, test_data: Dataset, scoring_method: Optional[ScoringMethod] = ScoringMethod.ACCURACY, **kwargs):
+        """
+        Score the model using test data.
+
+        :param test_data: Test data.
+        :type test_data: `Dataset`
+        :param scoring_method: The method for scoring predictions. Default is ACCURACY.
+        :type scoring_method: `ScoringMethod`, optional
+        :return: the score as float (for classifiers, between 0 and 1)
+        """
+        predicted = self._art_model.predict(test_data.get_samples())
+        y = check_and_transform_label_format(test_data.get_labels(), nb_classes=self.nb_classes)
+        if scoring_method == ScoringMethod.ACCURACY:
+            return np.count_nonzero(np.argmax(y, axis=1) == np.argmax(predicted, axis=1)) / predicted.shape[0]
+        else:
+            raise NotImplementedError
diff --git a/apt/utils/models/sklearn_model.py b/apt/utils/models/sklearn_model.py
index a64058e..81294a5 100644
--- a/apt/utils/models/sklearn_model.py
+++ b/apt/utils/models/sklearn_model.py
@@ -1,7 +1,5 @@
 from typing import Optional
 
-import numpy as np
-
 from sklearn.preprocessing import OneHotEncoder
 from sklearn.base import BaseEstimator
 
@@ -10,6 +8,7 @@ from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
 
 from art.estimators.classification.scikitlearn import SklearnClassifier as ArtSklearnClassifier
 from art.estimators.regression.scikitlearn import ScikitlearnRegressor
+from art.utils import check_and_transform_label_format
 
 
 class SklearnModel(Model):
@@ -54,12 +53,14 @@ class SklearnClassifier(SklearnModel):
         """
         Fit the model using the training data.
 
-        :param train_data: Training data.
+        :param train_data: Training data. Labels are expected to either be one-hot encoded or a 1D-array of categorical
+                           labels (consecutive integers starting at 0).
         :type train_data: `Dataset`
         :return: None
         """
-        encoder = OneHotEncoder(sparse=False)
-        y_encoded = encoder.fit_transform(train_data.get_labels().reshape(-1, 1))
+        y = train_data.get_labels()
+        self.nb_classes = self.get_nb_classes(y)
+        y_encoded = check_and_transform_label_format(y, nb_classes=self.nb_classes)
         self._art_model.fit(train_data.get_samples(), y_encoded, **kwargs)
 
     def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
@@ -70,7 +71,7 @@ class SklearnClassifier(SklearnModel):
         :type x: `Dataset`
         :return: Predictions from the model as numpy array (class probabilities, if supported).
         """
-        return self._art_model.predict(x, **kwargs)
+        return self._art_model.predict(x.get_samples(), **kwargs)
 
 
 class SklearnRegressor(SklearnModel):
@@ -112,4 +113,4 @@ class SklearnRegressor(SklearnModel):
         :type x: `Dataset`
         :return: Predictions from the model as numpy array.
         """
-        return self._art_model.predict(x, **kwargs)
+        return self._art_model.predict(x.get_samples(), **kwargs)
diff --git a/notebooks/attribute_inference_anonymization_nursery.ipynb b/notebooks/attribute_inference_anonymization_nursery.ipynb
index bfba540..19d9675 100644
--- a/notebooks/attribute_inference_anonymization_nursery.ipynb
+++ b/notebooks/attribute_inference_anonymization_nursery.ipynb
@@ -29,15 +29,198 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 121,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": "           parents     has_nurs        form children     housing     finance  \\\n8450   pretentious    very_crit      foster        1   less_conv  convenient   \n12147   great_pret    very_crit    complete        1    critical      inconv   \n2780         usual     critical    complete        4   less_conv  convenient   \n11924   great_pret     critical      foster        1    critical  convenient   \n59           usual       proper    complete        2  convenient  convenient   \n...            ...          ...         ...      ...         ...         ...   \n5193   pretentious  less_proper    complete        1  convenient      inconv   \n1375         usual  less_proper  incomplete        2   less_conv  convenient   \n10318   great_pret  less_proper      foster        4  convenient  convenient   \n6396   pretentious     improper   completed        3   less_conv  convenient   \n485          usual       proper  incomplete        1    critical      inconv   \n\n       social       health  \n8450        1    not_recom  \n12147       1  recommended  \n2780        1    not_recom  \n11924       1    not_recom  \n59          0    not_recom  \n...       ...          ...  \n5193        0  recommended  \n1375        1     priority  \n10318       0     priority  \n6396        1  recommended  \n485         1    not_recom  \n\n[10366 rows x 8 columns]",
-      "text/html": "<div>\n<style scoped>\n    .dataframe tbody tr th:only-of-type {\n        vertical-align: middle;\n    }\n\n    .dataframe tbody tr th {\n        vertical-align: top;\n    }\n\n    .dataframe thead th {\n        text-align: right;\n    }\n</style>\n<table border=\"1\" class=\"dataframe\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>parents</th>\n      <th>has_nurs</th>\n      <th>form</th>\n      <th>children</th>\n      <th>housing</th>\n      <th>finance</th>\n      <th>social</th>\n      <th>health</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>8450</th>\n      <td>pretentious</td>\n      <td>very_crit</td>\n      <td>foster</td>\n      <td>1</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>12147</th>\n      <td>great_pret</td>\n      <td>very_crit</td>\n      <td>complete</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>inconv</td>\n      <td>1</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>2780</th>\n      <td>usual</td>\n      <td>critical</td>\n      <td>complete</td>\n      <td>4</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>11924</th>\n      <td>great_pret</td>\n      <td>critical</td>\n      <td>foster</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>59</th>\n      <td>usual</td>\n      <td>proper</td>\n      <td>complete</td>\n      <td>2</td>\n      <td>convenient</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>...</th>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n    </tr>\n    <tr>\n      <th>5193</th>\n      
<td>pretentious</td>\n      <td>less_proper</td>\n      <td>complete</td>\n      <td>1</td>\n      <td>convenient</td>\n      <td>inconv</td>\n      <td>0</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>1375</th>\n      <td>usual</td>\n      <td>less_proper</td>\n      <td>incomplete</td>\n      <td>2</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>priority</td>\n    </tr>\n    <tr>\n      <th>10318</th>\n      <td>great_pret</td>\n      <td>less_proper</td>\n      <td>foster</td>\n      <td>4</td>\n      <td>convenient</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>priority</td>\n    </tr>\n    <tr>\n      <th>6396</th>\n      <td>pretentious</td>\n      <td>improper</td>\n      <td>completed</td>\n      <td>3</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>485</th>\n      <td>usual</td>\n      <td>proper</td>\n      <td>incomplete</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>inconv</td>\n      <td>1</td>\n      <td>not_recom</td>\n    </tr>\n  </tbody>\n</table>\n<p>10366 rows × 8 columns</p>\n</div>"
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>parents</th>\n",
+       "      <th>has_nurs</th>\n",
+       "      <th>form</th>\n",
+       "      <th>children</th>\n",
+       "      <th>housing</th>\n",
+       "      <th>finance</th>\n",
+       "      <th>social</th>\n",
+       "      <th>health</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>8450</th>\n",
+       "      <td>pretentious</td>\n",
+       "      <td>very_crit</td>\n",
+       "      <td>foster</td>\n",
+       "      <td>1</td>\n",
+       "      <td>less_conv</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>1</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>12147</th>\n",
+       "      <td>great_pret</td>\n",
+       "      <td>very_crit</td>\n",
+       "      <td>complete</td>\n",
+       "      <td>1</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>inconv</td>\n",
+       "      <td>1</td>\n",
+       "      <td>recommended</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2780</th>\n",
+       "      <td>usual</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>complete</td>\n",
+       "      <td>4</td>\n",
+       "      <td>less_conv</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>1</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>11924</th>\n",
+       "      <td>great_pret</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>foster</td>\n",
+       "      <td>1</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>1</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>59</th>\n",
+       "      <td>usual</td>\n",
+       "      <td>proper</td>\n",
+       "      <td>complete</td>\n",
+       "      <td>2</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>5193</th>\n",
+       "      <td>pretentious</td>\n",
+       "      <td>less_proper</td>\n",
+       "      <td>complete</td>\n",
+       "      <td>1</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>inconv</td>\n",
+       "      <td>0</td>\n",
+       "      <td>recommended</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1375</th>\n",
+       "      <td>usual</td>\n",
+       "      <td>less_proper</td>\n",
+       "      <td>incomplete</td>\n",
+       "      <td>2</td>\n",
+       "      <td>less_conv</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>1</td>\n",
+       "      <td>priority</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10318</th>\n",
+       "      <td>great_pret</td>\n",
+       "      <td>less_proper</td>\n",
+       "      <td>foster</td>\n",
+       "      <td>4</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>priority</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>6396</th>\n",
+       "      <td>pretentious</td>\n",
+       "      <td>improper</td>\n",
+       "      <td>completed</td>\n",
+       "      <td>3</td>\n",
+       "      <td>less_conv</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>1</td>\n",
+       "      <td>recommended</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>485</th>\n",
+       "      <td>usual</td>\n",
+       "      <td>proper</td>\n",
+       "      <td>incomplete</td>\n",
+       "      <td>1</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>inconv</td>\n",
+       "      <td>1</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>10366 rows × 8 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "           parents     has_nurs        form children     housing     finance  \\\n",
+       "8450   pretentious    very_crit      foster        1   less_conv  convenient   \n",
+       "12147   great_pret    very_crit    complete        1    critical      inconv   \n",
+       "2780         usual     critical    complete        4   less_conv  convenient   \n",
+       "11924   great_pret     critical      foster        1    critical  convenient   \n",
+       "59           usual       proper    complete        2  convenient  convenient   \n",
+       "...            ...          ...         ...      ...         ...         ...   \n",
+       "5193   pretentious  less_proper    complete        1  convenient      inconv   \n",
+       "1375         usual  less_proper  incomplete        2   less_conv  convenient   \n",
+       "10318   great_pret  less_proper      foster        4  convenient  convenient   \n",
+       "6396   pretentious     improper   completed        3   less_conv  convenient   \n",
+       "485          usual       proper  incomplete        1    critical      inconv   \n",
+       "\n",
+       "       social       health  \n",
+       "8450        1    not_recom  \n",
+       "12147       1  recommended  \n",
+       "2780        1    not_recom  \n",
+       "11924       1    not_recom  \n",
+       "59          0    not_recom  \n",
+       "...       ...          ...  \n",
+       "5193        0  recommended  \n",
+       "1375        1     priority  \n",
+       "10318       0     priority  \n",
+       "6396        1  recommended  \n",
+       "485         1    not_recom  \n",
+       "\n",
+       "[10366 rows x 8 columns]"
+      ]
      },
-     "execution_count": 1,
+     "execution_count": 121,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -47,9 +230,9 @@
     "import sys\n",
     "sys.path.insert(0, os.path.abspath('..'))\n",
     "\n",
-    "from apt.utils.dataset_utils import get_nursery_dataset\n",
+    "from apt.utils.dataset_utils import get_nursery_dataset_pd\n",
     "\n",
-    "(x_train, y_train), (x_test, y_test) = get_nursery_dataset(transform_social=True)\n",
+    "(x_train, y_train), (x_test, y_test) = get_nursery_dataset_pd(transform_social=True)\n",
     "\n",
     "x_train"
    ]
@@ -63,7 +246,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 122,
    "metadata": {},
    "outputs": [
     {
@@ -78,11 +261,25 @@
     "from sklearn.tree import DecisionTreeClassifier\n",
     "from art.estimators.classification.scikitlearn import ScikitlearnDecisionTreeClassifier\n",
     "from sklearn.preprocessing import OneHotEncoder\n",
+    "from sklearn.compose import ColumnTransformer\n",
+    "from sklearn.impute import SimpleImputer\n",
+    "from sklearn.pipeline import Pipeline\n",
     "\n",
-    "x_train_str = x_train.astype(str)\n",
-    "train_encoded = OneHotEncoder(sparse=False).fit_transform(x_train_str)\n",
-    "x_test_str = x_test.astype(str)\n",
-    "test_encoded = OneHotEncoder(sparse=False).fit_transform(x_test_str)\n",
+    "numeric_features = ['social']\n",
+    "categorical_features = ['children', 'parents', 'has_nurs', 'form', 'housing', 'finance', 'health']\n",
+    "numeric_transformer = Pipeline(\n",
+    "    steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]\n",
+    ")\n",
+    "categorical_transformer = OneHotEncoder(handle_unknown=\"ignore\", sparse=False)\n",
+    "preprocessor = ColumnTransformer(\n",
+    "    transformers=[\n",
+    "        (\"num\", numeric_transformer, numeric_features),\n",
+    "        (\"cat\", categorical_transformer, categorical_features),\n",
+    "    ]\n",
+    ")\n",
+    "\n",
+    "train_encoded = preprocessor.fit_transform(x_train)\n",
+    "test_encoded = preprocessor.transform(x_test)\n",
     "    \n",
     "model = DecisionTreeClassifier()\n",
     "model.fit(train_encoded, y_train)\n",
@@ -104,14 +301,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 123,
    "metadata": {},
    "outputs": [],
    "source": [
     "import numpy as np\n",
     "from art.attacks.inference.attribute_inference import AttributeInferenceBlackBox\n",
     "\n",
-    "attack_feature = 20\n",
+    "# index of the 'social' feature after preprocessing (the numeric transformer is listed first, so it is column 0)\n",
+    "attack_feature = 0\n",
     "\n",
     "# training data without attacked feature\n",
     "x_train_for_attack = np.delete(train_encoded, attack_feature, 1)\n",
@@ -140,14 +338,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 124,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "1.0\n"
+      "0.6000385876905268\n"
      ]
     }
    ],
@@ -155,7 +353,7 @@
     "# get inferred values\n",
     "values=[0, 1]\n",
     "\n",
-    "inferred_train_bb = bb_attack.infer(x_train_for_attack[attack_train_size:], x_train_predictions[attack_train_size:], values=values)\n",
+    "inferred_train_bb = bb_attack.infer(x_train_for_attack[attack_train_size:], pred=x_train_predictions[attack_train_size:], values=values)\n",
     "# check accuracy\n",
     "train_acc = np.sum(inferred_train_bb == np.around(x_train_feature[attack_train_size:], decimals=8).reshape(1,-1)) / len(inferred_train_bb)\n",
     "print(train_acc)"
@@ -165,7 +363,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "This means that for 64% of the training set, the attacked feature is inferred correctly using this attack."
+    "This means that for 60% of the training set, the attacked feature is inferred correctly using this attack."
    ]
   },
   {
@@ -178,14 +376,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 125,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.5122515917422342\n"
+      "0.6980513216284006\n"
      ]
     }
    ],
@@ -225,15 +423,198 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 126,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": "           parents     has_nurs        form children     housing     finance  \\\n0      pretentious    very_crit      foster        1   less_conv  convenient   \n1       great_pret    very_crit    complete        1    critical      inconv   \n2            usual     critical    complete        4   less_conv  convenient   \n3       great_pret     critical      foster        1    critical  convenient   \n4            usual       proper    complete        2  convenient  convenient   \n...            ...          ...         ...      ...         ...         ...   \n10361  pretentious  less_proper    complete        1  convenient      inconv   \n10362        usual  less_proper  incomplete        2   less_conv  convenient   \n10363   great_pret  less_proper      foster        4  convenient  convenient   \n10364  pretentious     improper   completed        3   less_conv  convenient   \n10365        usual       proper  incomplete        1    critical  convenient   \n\n      social       health  \n0          0    not_recom  \n1          1  recommended  \n2          0    not_recom  \n3          0    not_recom  \n4          0    not_recom  \n...      ...          ...  \n10361      0  recommended  \n10362      1     priority  \n10363      0     priority  \n10364      1  recommended  \n10365      0    not_recom  \n\n[10366 rows x 8 columns]",
-      "text/html": "<div>\n<style scoped>\n    .dataframe tbody tr th:only-of-type {\n        vertical-align: middle;\n    }\n\n    .dataframe tbody tr th {\n        vertical-align: top;\n    }\n\n    .dataframe thead th {\n        text-align: right;\n    }\n</style>\n<table border=\"1\" class=\"dataframe\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>parents</th>\n      <th>has_nurs</th>\n      <th>form</th>\n      <th>children</th>\n      <th>housing</th>\n      <th>finance</th>\n      <th>social</th>\n      <th>health</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>0</th>\n      <td>pretentious</td>\n      <td>very_crit</td>\n      <td>foster</td>\n      <td>1</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>1</th>\n      <td>great_pret</td>\n      <td>very_crit</td>\n      <td>complete</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>inconv</td>\n      <td>1</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>2</th>\n      <td>usual</td>\n      <td>critical</td>\n      <td>complete</td>\n      <td>4</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>3</th>\n      <td>great_pret</td>\n      <td>critical</td>\n      <td>foster</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>4</th>\n      <td>usual</td>\n      <td>proper</td>\n      <td>complete</td>\n      <td>2</td>\n      <td>convenient</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n    <tr>\n      <th>...</th>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n      <td>...</td>\n    </tr>\n    <tr>\n      <th>10361</th>\n      
<td>pretentious</td>\n      <td>less_proper</td>\n      <td>complete</td>\n      <td>1</td>\n      <td>convenient</td>\n      <td>inconv</td>\n      <td>0</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>10362</th>\n      <td>usual</td>\n      <td>less_proper</td>\n      <td>incomplete</td>\n      <td>2</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>priority</td>\n    </tr>\n    <tr>\n      <th>10363</th>\n      <td>great_pret</td>\n      <td>less_proper</td>\n      <td>foster</td>\n      <td>4</td>\n      <td>convenient</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>priority</td>\n    </tr>\n    <tr>\n      <th>10364</th>\n      <td>pretentious</td>\n      <td>improper</td>\n      <td>completed</td>\n      <td>3</td>\n      <td>less_conv</td>\n      <td>convenient</td>\n      <td>1</td>\n      <td>recommended</td>\n    </tr>\n    <tr>\n      <th>10365</th>\n      <td>usual</td>\n      <td>proper</td>\n      <td>incomplete</td>\n      <td>1</td>\n      <td>critical</td>\n      <td>convenient</td>\n      <td>0</td>\n      <td>not_recom</td>\n    </tr>\n  </tbody>\n</table>\n<p>10366 rows × 8 columns</p>\n</div>"
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>parents</th>\n",
+       "      <th>has_nurs</th>\n",
+       "      <th>form</th>\n",
+       "      <th>children</th>\n",
+       "      <th>housing</th>\n",
+       "      <th>finance</th>\n",
+       "      <th>social</th>\n",
+       "      <th>health</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>pretentious</td>\n",
+       "      <td>very_crit</td>\n",
+       "      <td>foster</td>\n",
+       "      <td>1</td>\n",
+       "      <td>less_conv</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>great_pret</td>\n",
+       "      <td>very_crit</td>\n",
+       "      <td>complete</td>\n",
+       "      <td>1</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>inconv</td>\n",
+       "      <td>1</td>\n",
+       "      <td>recommended</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>usual</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>complete</td>\n",
+       "      <td>4</td>\n",
+       "      <td>less_conv</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>great_pret</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>foster</td>\n",
+       "      <td>1</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>usual</td>\n",
+       "      <td>proper</td>\n",
+       "      <td>complete</td>\n",
+       "      <td>2</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>...</th>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "      <td>...</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10361</th>\n",
+       "      <td>pretentious</td>\n",
+       "      <td>less_proper</td>\n",
+       "      <td>complete</td>\n",
+       "      <td>1</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>recommended</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10362</th>\n",
+       "      <td>usual</td>\n",
+       "      <td>less_proper</td>\n",
+       "      <td>incomplete</td>\n",
+       "      <td>2</td>\n",
+       "      <td>less_conv</td>\n",
+       "      <td>inconv</td>\n",
+       "      <td>0</td>\n",
+       "      <td>priority</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10363</th>\n",
+       "      <td>great_pret</td>\n",
+       "      <td>less_proper</td>\n",
+       "      <td>foster</td>\n",
+       "      <td>4</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>priority</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10364</th>\n",
+       "      <td>pretentious</td>\n",
+       "      <td>improper</td>\n",
+       "      <td>completed</td>\n",
+       "      <td>3</td>\n",
+       "      <td>less_conv</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>recommended</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>10365</th>\n",
+       "      <td>usual</td>\n",
+       "      <td>proper</td>\n",
+       "      <td>incomplete</td>\n",
+       "      <td>1</td>\n",
+       "      <td>critical</td>\n",
+       "      <td>convenient</td>\n",
+       "      <td>0</td>\n",
+       "      <td>not_recom</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "<p>10366 rows × 8 columns</p>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "           parents     has_nurs        form children     housing     finance  \\\n",
+       "0      pretentious    very_crit      foster        1   less_conv  convenient   \n",
+       "1       great_pret    very_crit    complete        1    critical      inconv   \n",
+       "2            usual     critical    complete        4   less_conv  convenient   \n",
+       "3       great_pret     critical      foster        1    critical  convenient   \n",
+       "4            usual       proper    complete        2  convenient  convenient   \n",
+       "...            ...          ...         ...      ...         ...         ...   \n",
+       "10361  pretentious  less_proper    complete        1  convenient  convenient   \n",
+       "10362        usual  less_proper  incomplete        2   less_conv      inconv   \n",
+       "10363   great_pret  less_proper      foster        4  convenient  convenient   \n",
+       "10364  pretentious     improper   completed        3   less_conv  convenient   \n",
+       "10365        usual       proper  incomplete        1    critical  convenient   \n",
+       "\n",
+       "      social       health  \n",
+       "0          0    not_recom  \n",
+       "1          1  recommended  \n",
+       "2          0    not_recom  \n",
+       "3          0    not_recom  \n",
+       "4          0    not_recom  \n",
+       "...      ...          ...  \n",
+       "10361      0  recommended  \n",
+       "10362      0     priority  \n",
+       "10363      0     priority  \n",
+       "10364      0  recommended  \n",
+       "10365      0    not_recom  \n",
+       "\n",
+       "[10366 rows x 8 columns]"
+      ]
      },
-     "execution_count": 6,
+     "execution_count": 126,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -244,24 +625,24 @@
     "\n",
     "features = x_train.columns\n",
     "QI = [\"finance\", \"social\", \"health\"]\n",
-    "categorical_features = [\"parents\", \"has_nurs\", \"form\", \"housing\", \"finance\", \"health\", 'children']\n",
-    "QI_indexes = [i for i, v in enumerate(features) if v in QI]\n",
-    "categorical_features_indexes = [i for i, v in enumerate(features) if v in categorical_features]\n",
-    "anonymizer = Anonymize(100, QI_indexes, categorical_features=categorical_features_indexes)\n",
+    "\n",
+    "anonymizer = Anonymize(100, QI, categorical_features=categorical_features)\n",
     "anon = anonymizer.anonymize(ArrayDataset(x_train, x_train_predictions))\n",
-    "anon\n"
+    "anon"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 127,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": "7585"
+      "text/plain": [
+       "7585"
+      ]
      },
-     "execution_count": 7,
+     "execution_count": 127,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -273,14 +654,16 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": 128,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": "5766"
+      "text/plain": [
+       "3001"
+      ]
      },
-     "execution_count": 8,
+     "execution_count": 128,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -299,20 +682,20 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": 129,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Anonymized model accuracy:  0.9976851851851852\n"
+      "Anonymized model accuracy:  0.9054783950617284\n"
      ]
     }
    ],
    "source": [
-    "anon_str = anon.astype(str)\n",
-    "anon_encoded = OneHotEncoder(sparse=False).fit_transform(anon_str)\n",
+    "anon_encoded = preprocessor.fit_transform(anon)\n",
+    "test_encoded = preprocessor.transform(x_test)\n",
     "\n",
     "anon_model = DecisionTreeClassifier()\n",
     "anon_model.fit(anon_encoded, y_train)\n",
@@ -332,18 +715,23 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 10,
+   "execution_count": 130,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "1.0\n"
+      "0.5813235577850666\n"
      ]
     }
    ],
    "source": [
+    "# training data without attacked feature\n",
+    "x_train_for_attack = np.delete(train_encoded, attack_feature, 1)\n",
+    "# only attacked feature\n",
+    "x_train_feature = train_encoded[:, attack_feature].copy().reshape(-1, 1)\n",
+    "\n",
     "anon_bb_attack = AttributeInferenceBlackBox(anon_art_classifier, attack_feature=attack_feature)\n",
     "\n",
     "# get original model's predictions\n",
@@ -353,7 +741,7 @@
     "anon_bb_attack.fit(train_encoded[:attack_train_size])\n",
     "\n",
     "# get inferred values\n",
-    "inferred_train_anon_bb = anon_bb_attack.infer(x_train_for_attack[attack_train_size:], anon_x_train_predictions[attack_train_size:], values=values)\n",
+    "inferred_train_anon_bb = anon_bb_attack.infer(x_train_for_attack[attack_train_size:], pred=anon_x_train_predictions[attack_train_size:], values=values)\n",
     "# check accuracy\n",
     "train_acc = np.sum(inferred_train_anon_bb == np.around(x_train_feature[attack_train_size:], decimals=8).reshape(1,-1)) / len(inferred_train_anon_bb)\n",
     "print(train_acc)"
@@ -368,14 +756,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 11,
+   "execution_count": 131,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.5245996527107852\n"
+      "0.6857032606598495\n"
      ]
     }
    ],
@@ -399,15 +787,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 12,
+   "execution_count": 132,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(0.49415432579890883, 0.48976438779451525)\n",
-      "(0.49415432579890883, 0.48976438779451525)\n"
+      "(0.3353658536585366, 0.22540983606557377)\n",
+      "(0.3354908306364617, 0.18208430913348947)\n"
      ]
     }
    ],
@@ -444,15 +832,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 13,
+   "execution_count": 133,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(1.0, 0.019204655674102813)\n",
-      "(0.9829787234042553, 0.04481086323957323)\n"
+      "(0.6457357075913777, 0.2002324905550712)\n",
+      "(0.6384266263237519, 0.12263876780005813)\n"
      ]
     }
    ],
@@ -483,24 +871,26 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
+   "execution_count": 134,
    "metadata": {},
    "outputs": [],
    "source": [
-    "anonymizer2 = Anonymize(1000, QI_indexes, categorical_features=categorical_features_indexes)\n",
+    "anonymizer2 = Anonymize(1000, QI, categorical_features=categorical_features)\n",
     "anon2 = anonymizer2.anonymize(ArrayDataset(x_train, x_train_predictions))"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 15,
+   "execution_count": 135,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": "4226"
+      "text/plain": [
+       "1727"
+      ]
      },
-     "execution_count": 15,
+     "execution_count": 135,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -519,20 +909,20 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
+   "execution_count": 136,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Anonymized model accuracy:  0.9930555555555556\n"
+      "Anonymized model accuracy:  0.8981481481481481\n"
      ]
     }
    ],
    "source": [
-    "anon2_str = anon2.astype(str)\n",
-    "anon2_encoded = OneHotEncoder(sparse=False).fit_transform(anon2_str)\n",
+    "anon2_encoded = preprocessor.fit_transform(anon2)\n",
+    "test_encoded = preprocessor.transform(x_test)\n",
     "\n",
     "anon2_model = DecisionTreeClassifier()\n",
     "anon2_model.fit(anon2_encoded, y_train)\n",
@@ -552,18 +942,23 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 17,
+   "execution_count": 137,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "1.0\n"
+      "0.546015820953116\n"
      ]
     }
    ],
    "source": [
+    "# training data without attacked feature\n",
+    "x_train_for_attack = np.delete(train_encoded, attack_feature, 1)\n",
+    "# only attacked feature\n",
+    "x_train_feature = train_encoded[:, attack_feature].copy().reshape(-1, 1)\n",
+    "\n",
     "anon2_bb_attack = AttributeInferenceBlackBox(anon2_art_classifier, attack_feature=attack_feature)\n",
     "\n",
     "# get original model's predictions\n",
@@ -573,7 +968,7 @@
     "anon2_bb_attack.fit(train_encoded[:attack_train_size])\n",
     "\n",
     "# get inferred values\n",
-    "inferred_train_anon2_bb = anon2_bb_attack.infer(x_train_for_attack[attack_train_size:], anon2_x_train_predictions[attack_train_size:], values=values)\n",
+    "inferred_train_anon2_bb = anon2_bb_attack.infer(x_train_for_attack[attack_train_size:], pred=anon2_x_train_predictions[attack_train_size:], values=values)\n",
     "# check accuracy\n",
     "train_acc = np.sum(inferred_train_anon2_bb == np.around(x_train_feature[attack_train_size:], decimals=8).reshape(1,-1)) / len(inferred_train_anon2_bb)\n",
     "print(train_acc)"
@@ -588,14 +983,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 18,
+   "execution_count": 138,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "0.515820953115956\n"
+      "0.6680493922438742\n"
      ]
     }
    ],
@@ -612,17 +1007,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 19,
+   "execution_count": 139,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(0.49415432579890883, 0.48976438779451525)\n",
-      "(0.49415432579890883, 0.48976438779451525)\n",
-      "(1.0, 0.019204655674102813)\n",
-      "(1.0, 0.026382153249272552)\n"
+      "(0.3353658536585366, 0.22540983606557377)\n",
+      "(0.32242990654205606, 0.16159250585480095)\n",
+      "(0.6457357075913777, 0.2002324905550712)\n",
+      "(1, 0.0)\n"
      ]
     }
    ],
@@ -655,26 +1050,27 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 20,
+   "execution_count": 140,
    "metadata": {},
    "outputs": [],
    "source": [
     "QI2 = [\"parents\", \"has_nurs\", \"form\", \"children\", \"housing\", \"finance\", \"social\", \"health\"]\n",
-    "QI2_indexes = [i for i, v in enumerate(features) if v in QI2]\n",
-    "anonymizer3 = Anonymize(100, QI2_indexes, categorical_features=categorical_features_indexes)\n",
+    "anonymizer3 = Anonymize(100, QI2, categorical_features=categorical_features)\n",
     "anon3 = anonymizer3.anonymize(ArrayDataset(x_train, x_train_predictions))"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 21,
+   "execution_count": 141,
    "metadata": {},
    "outputs": [
     {
      "data": {
-      "text/plain": "39"
+      "text/plain": [
+       "39"
+      ]
      },
-     "execution_count": 21,
+     "execution_count": 141,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -686,22 +1082,22 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 22,
+   "execution_count": 142,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Anonymized model accuracy:  0.751929012345679\n",
-      "BB attack accuracy:  1.0\n",
-      "WB attack accuracy:  0.5187150299054601\n"
+      "Anonymized model accuracy:  0.7600308641975309\n",
+      "BB attack accuracy:  0.5330889446266641\n",
+      "WB attack accuracy:  0.6680493922438742\n"
      ]
     }
    ],
    "source": [
-    "anon3_str = anon3.astype(str)\n",
-    "anon3_encoded = OneHotEncoder(sparse=False).fit_transform(anon3_str)\n",
+    "anon3_encoded = preprocessor.fit_transform(anon3)\n",
+    "test_encoded = preprocessor.transform(x_test)\n",
     "\n",
     "anon3_model = DecisionTreeClassifier()\n",
     "anon3_model.fit(anon3_encoded, y_train)\n",
@@ -710,6 +1106,11 @@
     "\n",
     "print('Anonymized model accuracy: ', anon3_model.score(test_encoded, y_test))\n",
     "\n",
+    "# training data without attacked feature\n",
+    "x_train_for_attack = np.delete(train_encoded, attack_feature, 1)\n",
+    "# only attacked feature\n",
+    "x_train_feature = train_encoded[:, attack_feature].copy().reshape(-1, 1)\n",
+    "\n",
     "anon3_bb_attack = AttributeInferenceBlackBox(anon3_art_classifier, attack_feature=attack_feature)\n",
     "\n",
     "# get original model's predictions\n",
@@ -719,7 +1120,7 @@
     "anon3_bb_attack.fit(train_encoded[:attack_train_size])\n",
     "\n",
     "# get inferred values\n",
-    "inferred_train_anon3_bb = anon3_bb_attack.infer(x_train_for_attack[attack_train_size:], anon3_x_train_predictions[attack_train_size:], values=values)\n",
+    "inferred_train_anon3_bb = anon3_bb_attack.infer(x_train_for_attack[attack_train_size:], pred=anon3_x_train_predictions[attack_train_size:], values=values)\n",
     "# check accuracy\n",
     "train_acc = np.sum(inferred_train_anon3_bb == np.around(x_train_feature[attack_train_size:], decimals=8).reshape(1,-1)) / len(inferred_train_anon2_bb)\n",
     "print('BB attack accuracy: ', train_acc)\n",
@@ -736,17 +1137,17 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 23,
+   "execution_count": 143,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "(0.49415432579890883, 0.48976438779451525)\n",
-      "(0.49415432579890883, 0.48976438779451525)\n",
-      "(1.0, 0.019204655674102813)\n",
-      "(1.0, 0.032201745877788554)\n"
+      "(0.3353658536585366, 0.22540983606557377)\n",
+      "(0.344644750795334, 0.19028103044496486)\n",
+      "(0.6457357075913777, 0.2002324905550712)\n",
+      "(1, 0.0)\n"
      ]
     }
    ],
@@ -793,4 +1194,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 2
-}
\ No newline at end of file
+}
diff --git a/notebooks/minimization_adult.ipynb b/notebooks/minimization_adult.ipynb
index e8ccc20..a5a56ab 100644
--- a/notebooks/minimization_adult.ipynb
+++ b/notebooks/minimization_adult.ipynb
@@ -27,7 +27,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 15,
+   "execution_count": 1,
    "metadata": {},
    "outputs": [
     {
@@ -42,18 +42,6 @@
       " [2.2000e+01 9.0000e+00 0.0000e+00 0.0000e+00 2.0000e+01]\n",
       " [5.2000e+01 9.0000e+00 1.5024e+04 0.0000e+00 4.0000e+01]]\n"
      ]
-    },
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "/var/folders/9b/qbtw28w53355cvpjs4qn83yc0000gn/T/ipykernel_13726/1357868359.py:22: DeprecationWarning: `np.int` is a deprecated alias for the builtin `int`. To silence this warning, use `int` by itself. Doing this will not modify any behavior and is safe. When replacing `np.int`, you may wish to use e.g. `np.int64` or `np.int32` to specify the precision. If you wish to review your current use, check the release note link for additional information.\n",
-      "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n",
-      "  y_train = y_train.astype(np.int)\n",
-      "/var/folders/9b/qbtw28w53355cvpjs4qn83yc0000gn/T/ipykernel_13726/1357868359.py:26: DeprecationWarning: `np.int` is a deprecated alias for the builtin `int`. To silence this warning, use `int` by itself. Doing this will not modify any behavior and is safe. When replacing `np.int`, you may wish to use e.g. `np.int64` or `np.int32` to specify the precision. If you wish to review your current use, check the release note link for additional information.\n",
-      "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n",
-      "  y_test = y_test.astype(np.int)\n"
-     ]
     }
    ],
    "source": [
@@ -96,24 +84,28 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
+   "execution_count": 2,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Base model accuracy:  0.8183158282660771\n"
+      "Base model accuracy:  0.8190528837295007\n"
      ]
     }
    ],
    "source": [
+    "import os\n",
+    "import sys\n",
+    "sys.path.insert(0, os.path.abspath('..'))\n",
+    "\n",
     "from apt.utils.datasets import ArrayDataset\n",
     "from apt.utils.models import SklearnClassifier, ModelOutputType\n",
     "from sklearn.tree import DecisionTreeClassifier\n",
     "\n",
     "base_est = DecisionTreeClassifier()\n",
-    "model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)\n",
+    "model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)\n",
     "model.fit(ArrayDataset(x_train, y_train))\n",
     "\n",
     "print('Base model accuracy: ', model.score(ArrayDataset(x_test, y_test)))"
@@ -129,34 +121,30 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 17,
+   "execution_count": 4,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.936540\n",
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.920665\n",
       "Improving accuracy\n",
-      "feature to remove: 2\n",
-      "Removed feature: 2, new relative accuracy: 0.935261\n",
-      "feature to remove: 4\n",
-      "Removed feature: 4, new relative accuracy: 0.946776\n",
-      "feature to remove: 0\n",
-      "Removed feature: 0, new relative accuracy: 0.972876\n",
       "feature to remove: 1\n",
-      "Removed feature: 1, new relative accuracy: 0.992835\n",
+      "Removed feature: 1, new relative accuracy: 0.920026\n",
+      "feature to remove: 0\n",
+      "Removed feature: 0, new relative accuracy: 0.938580\n",
+      "feature to remove: 4\n",
+      "Removed feature: 4, new relative accuracy: 0.987204\n",
+      "feature to remove: 2\n",
+      "Removed feature: 2, new relative accuracy: 0.992962\n",
       "feature to remove: 3\n",
       "Removed feature: 3, new relative accuracy: 1.000000\n",
-      "Accuracy on minimized data:  0.8231229847996315\n"
+      "Accuracy on minimized data:  0.8165771297006907\n"
      ]
     }
    ],
    "source": [
-    "import sys\n",
-    "import os\n",
-    "sys.path.insert(0, os.path.abspath('..'))\n",
-    "\n",
     "from apt.minimization import GeneralizeToRepresentative\n",
     "from sklearn.model_selection import train_test_split\n",
     "\n",
@@ -169,7 +157,7 @@
     "# Don't forget to leave a hold-out set for final validation!\n",
     "X_generalizer_train, x_test, y_generalizer_train, y_test = train_test_split(x_test, y_test, stratify=y_test,\n",
     "                                                                test_size = 0.4, random_state = 38)\n",
-    "x_train_predictions = model.predict(X_generalizer_train)\n",
+    "x_train_predictions = model.predict(ArrayDataset(X_generalizer_train))\n",
     "if x_train_predictions.shape[1] > 1:\n",
     "    x_train_predictions = np.argmax(x_train_predictions, axis=1)\n",
     "minimizer.fit(dataset=ArrayDataset(X_generalizer_train, x_train_predictions))\n",
@@ -187,14 +175,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 18,
+   "execution_count": 5,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "{'ranges': {}, 'categories': {}, 'untouched': ['4', '1', '3', '0', '2']}\n"
+      "{'ranges': {}, 'categories': {}, 'untouched': ['2', '4', '3', '1', '0']}\n"
      ]
     }
    ],
@@ -214,25 +202,25 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 19,
+   "execution_count": 6,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.936540\n",
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.920665\n",
       "Improving accuracy\n",
-      "feature to remove: 2\n",
-      "Removed feature: 2, new relative accuracy: 0.935261\n",
-      "feature to remove: 4\n",
-      "Removed feature: 4, new relative accuracy: 0.946776\n",
-      "feature to remove: 0\n",
-      "Removed feature: 0, new relative accuracy: 0.972876\n",
       "feature to remove: 1\n",
-      "Removed feature: 1, new relative accuracy: 0.992835\n",
-      "Accuracy on minimized data:  0.8192845079072624\n",
-      "{'ranges': {'3': [569.0, 782.0, 870.0, 870.5, 938.0, 1016.5, 1311.5, 1457.0, 1494.5, 1596.0, 1629.5, 1684.0, 1805.0, 1859.0, 1867.5, 1881.5, 1938.0, 1978.5, 2119.0, 2210.0, 2218.0, 2244.5, 2298.5, 2443.5]}, 'categories': {}, 'untouched': ['2', '1', '0', '4']}\n"
+      "Removed feature: 1, new relative accuracy: 0.920026\n",
+      "feature to remove: 0\n",
+      "Removed feature: 0, new relative accuracy: 0.938580\n",
+      "feature to remove: 4\n",
+      "Removed feature: 4, new relative accuracy: 0.987204\n",
+      "feature to remove: 2\n",
+      "Removed feature: 2, new relative accuracy: 0.992962\n",
+      "Accuracy on minimized data:  0.8100537221795856\n",
+      "{'ranges': {'3': [704.0, 782.0, 870.0, 951.0, 1588.0, 1647.5, 1684.0, 1805.0, 1923.0, 2168.5]}, 'categories': {}, 'untouched': ['2', '4', '1', '0']}\n"
      ]
     }
    ],
@@ -276,4 +264,4 @@
  },
  "nbformat": 4,
  "nbformat_minor": 2
-}
\ No newline at end of file
+}
diff --git a/notebooks/minimization_diabetes_reg.ipynb b/notebooks/minimization_diabetes_reg.ipynb
index 597d77a..b8fc2fb 100644
--- a/notebooks/minimization_diabetes_reg.ipynb
+++ b/notebooks/minimization_diabetes_reg.ipynb
@@ -14,31 +14,33 @@
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "In this tutorial we will show how to perform data minimization for regression ML models using the minimization module.\n",
     "\n",
     "We will show you applying data minimization to a different trained regression models."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "## Load data\n",
-    "QI parameter determines which features will be minimized."
-   ],
    "metadata": {
-    "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "## Load data\n",
+    "QI parameter determines which features will be minimized."
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": 54,
+   "execution_count": 7,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "from sklearn.datasets import load_diabetes\n",
@@ -49,27 +51,24 @@
     "\n",
     "features = ['age', 'sex', 'bmi', 'bp',\n",
     "                's1', 's2', 's3', 's4', 's5', 's6']\n",
-    "QI = [0, 2, 5, 8, 9]"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+    "QI = ['age', 'bmi', 's2', 's5', 's6']"
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "## Train DecisionTreeRegressor model"
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": 55,
+   "execution_count": 8,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [
     {
      "name": "stdout",
@@ -86,27 +85,24 @@
     "model1 = DecisionTreeRegressor(random_state=10, min_samples_split=2)\n",
     "model1.fit(X_train, y_train)\n",
     "print('Base model accuracy (R2 score): ', model1.score(X_test, y_test))"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "## Run minimization\n",
     "We will try to run minimization with only a subset of the features."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": 56,
+   "execution_count": 9,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [
     {
      "name": "stdout",
@@ -121,14 +117,14 @@
       "feature to remove: bmi\n",
       "Removed feature: bmi, new relative accuracy: 0.718978\n",
       "Accuracy on minimized data:  0.11604533946025941\n",
-      "generalizations:  {'ranges': {'age': [-0.07090024650096893, -0.043656209483742714, -0.041839939542114735, -0.03639113181270659, -0.01459590089507401, -0.012779632292222232, -0.009147093165665865, -0.0036982858437113464, 0.03989217430353165, 0.039892176166176796, 0.05623859912157059, 0.06713621318340302], 's2': [-0.0550188384950161, -0.0285577941685915, -0.024643437936902046, -0.02135537937283516, -0.013683241792023182, -0.006480826530605555, 0.009176596067845821, 0.023111702874302864, 0.02420772146433592, 0.02655633445829153, 0.039082273840904236]}, 'categories': {}, 'untouched': ['s3', 'bmi', 's6', 'bp', 's4', 's5', 'sex', 's1']}\n"
+      "generalizations:  {'ranges': {'age': [-0.07090024650096893, -0.043656209483742714, -0.041839939542114735, -0.03639113181270659, -0.01459590089507401, -0.012779632292222232, -0.009147093165665865, -0.0036982858437113464, 0.03989217430353165, 0.039892176166176796, 0.05623859912157059, 0.06713621318340302], 's2': [-0.0550188384950161, -0.0285577941685915, -0.024643437936902046, -0.02135537937283516, -0.013683241792023182, -0.006480826530605555, 0.009176596067845821, 0.023111702874302864, 0.02420772146433592, 0.02655633445829153, 0.039082273840904236]}, 'categories': {}, 'untouched': ['s3', 's6', 's5', 'bp', 'bmi', 's4', 's1', 'sex']}\n"
      ]
     }
    ],
    "source": [
     "# note that is_regression param is True\n",
     "\n",
-    "minimizer1 = GeneralizeToRepresentative(model1, target_accuracy=0.7, features=features, is_regression=True,\n",
+    "minimizer1 = GeneralizeToRepresentative(model1, target_accuracy=0.7, is_regression=True,\n",
     "                                    features_to_minimize=QI)\n",
     "\n",
     "# Fitting the minimizar can be done either on training or test data. Doing it with test data is better as the\n",
@@ -139,32 +135,40 @@
     "                                                                test_size = 0.4, random_state = 38)\n",
     "\n",
     "x_train_predictions1 = model1.predict(X_generalizer_train1)\n",
-    "minimizer1.fit(X_generalizer_train1, x_train_predictions1)\n",
-    "transformed1 = minimizer1.transform(x_test1)\n",
+    "minimizer1.fit(X_generalizer_train1, x_train_predictions1, features_names=features)\n",
+    "transformed1 = minimizer1.transform(x_test1, features_names=features)\n",
     "print('Accuracy on minimized data: ', model1.score(transformed1, y_test1))\n",
     "print('generalizations: ',minimizer1.generalizations_)#%% md"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
-   "source": [
-    "## Train linear regression model"
-   ],
    "metadata": {
-    "collapsed": false,
     "pycharm": {
      "name": "#%% md\n"
     }
-   }
+   },
+   "source": [
+    "## Train linear regression model"
+   ]
   },
   {
    "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Base model accuracy (R2 score):  0.5080618258593723\n"
+     ]
+    }
+   ],
    "source": [
     "from sklearn.linear_model import LinearRegression\n",
     "from apt.minimization import GeneralizeToRepresentative\n",
@@ -172,49 +176,42 @@
     "model2 = LinearRegression()\n",
     "model2.fit(X_train, y_train)\n",
     "print('Base model accuracy (R2 score): ', model2.score(X_test, y_test))"
-   ],
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Run minimization\n",
+    "We will try to run minimization with only a subset of the features."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
    "metadata": {
-    "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
    },
-   "execution_count": null,
-   "outputs": []
-  },
-  {
-   "cell_type": "markdown",
-   "source": [
-    "## Run minimization\n",
-    "We will try to run minimization with only a subset of the features."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 58,
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.225782\n",
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.355377\n",
       "Improving accuracy\n",
-      "feature to remove: age\n",
-      "Removed feature: age, new relative accuracy: 0.223565\n",
       "feature to remove: s2\n",
-      "Removed feature: s2, new relative accuracy: 0.759788\n",
-      "Accuracy on minimized data:  0.4414329261774286\n",
-      "generalizations:  {'ranges': {'bmi': [-0.0660245232284069, -0.06171327643096447, -0.048779530450701714, -0.036923596635460854, -0.022912041284143925, -0.015906263142824173, -0.009978296235203743, 0.007266696775332093, 0.022356065921485424, 0.028822937980294228, 0.04499012045562267, 0.053073709830641747, 0.10103634744882584], 's5': [-0.08940735459327698, -0.07823517918586731, -0.07310866191983223, -0.07022909820079803, -0.06740894541144371, -0.06558558344841003, -0.041897499933838844, -0.04049498960375786, -0.03781316243112087, -0.033939776942133904, -0.03263746201992035, -0.02538660168647766, -0.023219254799187183, -0.017585186287760735, -0.016525186598300934, -0.008522996446117759, 0.0015758189256303012, 0.012934560421854258, 0.014069339726120234, 0.015929921995848417, 0.01947084255516529, 0.028651678003370762, 0.03358383011072874, 0.03639278281480074, 0.041416410356760025, 0.06386702693998814], 's6': [-0.07356456853449345, -0.052854035049676895, -0.048711927607655525, -0.0383566590026021, -0.02800139266764745, -0.021788232028484344, -0.007290858076885343, -0.007290857844054699, 0.017561784014105797, 0.02377494378015399, 0.02791705122217536, 0.02998810407007113, 0.054840744473040104]}, 'categories': {}, 'untouched': ['s2', 's3', 'bp', 's4', 'age', 'sex', 's1']}\n"
+      "Removed feature: s2, new relative accuracy: 0.773233\n",
+      "Accuracy on minimized data:  0.3945625296515525\n",
+      "generalizations:  {'ranges': {'age': [-0.06181889958679676, -0.027309785597026348, -0.012779631884768605, -0.0036982858437113464, -0.001882016658782959, 0.0035667913034558296, 0.01991321425884962, 0.021729483967646956, 0.02717829099856317, 0.04534098319709301, 0.05805486813187599], 'bmi': [-0.0660245232284069, -0.06171327643096447, -0.048779530450701714, -0.036923596635460854, -0.022912041284143925, -0.015906263142824173, -0.009978296235203743, 0.007266696775332093, 0.022356065921485424, 0.028822937980294228, 0.04499012045562267, 0.04876246117055416, 0.053073709830641747, 0.10103634744882584], 's5': [-0.08940735459327698, -0.07823517918586731, -0.07310866191983223, -0.07022909820079803, -0.06740894541144371, -0.06558558344841003, -0.041897499933838844, -0.03781316243112087, -0.033939776942133904, -0.03263746201992035, -0.02538660168647766, -0.023219254799187183, -0.017585186287760735, -0.016525186598300934, -0.008522996446117759, -0.0048803192912600935, 0.0002040128456428647, 0.0015758189256303012, 0.008132445393130183, 0.012934560421854258, 0.014069339726120234, 0.015929921995848417, 0.01947084255516529, 0.028651678003370762, 0.03358383011072874, 0.03639278281480074, 0.041416410356760025], 's6': [-0.07356456853449345, -0.052854035049676895, -0.048711927607655525, -0.044569820165634155, -0.0383566590026021, -0.021788232028484344, -0.017646125052124262, -0.013504017610102892, 0.02377494378015399, 0.06519601307809353, 0.08383549377322197]}, 'categories': {}, 'untouched': ['s3', 's2', 'bp', 's4', 's1', 'sex']}\n"
      ]
     }
    ],
    "source": [
     "# note that is_regression param is True\n",
     "\n",
-    "minimizer2 = GeneralizeToRepresentative(model2, target_accuracy=0.7, features=features, is_regression=True,\n",
+    "minimizer2 = GeneralizeToRepresentative(model2, target_accuracy=0.7, is_regression=True,\n",
     "                                    features_to_minimize=QI)\n",
     "\n",
     "# Fitting the minimizar can be done either on training or test data. Doing it with test data is better as the\n",
@@ -225,17 +222,11 @@
     "                                                                test_size = 0.4, random_state = 38)\n",
     "\n",
     "x_train_predictions2 = model2.predict(X_generalizer_train2)\n",
-    "minimizer2.fit(X_generalizer_train2, x_train_predictions2)\n",
-    "transformed2 = minimizer2.transform(x_test2)\n",
+    "minimizer2.fit(X_generalizer_train2, x_train_predictions2, features_names=features)\n",
+    "transformed2 = minimizer2.transform(x_test2, features_names=features)\n",
     "print('Accuracy on minimized data: ', model2.score(transformed2, y_test2))\n",
     "print('generalizations: ',minimizer2.generalizations_)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   }
  ],
  "metadata": {
@@ -247,16 +238,16 @@
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
-    "version": 2
+    "version": 3
    },
    "file_extension": ".py",
    "mimetype": "text/x-python",
    "name": "python",
    "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython2",
-   "version": "2.7.6"
+   "pygments_lexer": "ipython3",
+   "version": "3.8.3"
   }
  },
  "nbformat": 4,
- "nbformat_minor": 0
-}
\ No newline at end of file
+ "nbformat_minor": 1
+}
diff --git a/notebooks/minimization_german_credit.ipynb b/notebooks/minimization_german_credit.ipynb
index 03af5f0..03a4cce 100644
--- a/notebooks/minimization_german_credit.ipynb
+++ b/notebooks/minimization_german_credit.ipynb
@@ -2,37 +2,36 @@
  "cells": [
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "# Applying data minimization with categorical data and only a subset of the features to a trained ML model"
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "In this tutorial we will show how to perform data minimization for ML models using the minimization module.\n",
     "\n",
     "This will be demonstarted using the German Credit dataset (original dataset can be found here: https://archive.ics.uci.edu/ml/machine-learning-databases/statlog/german/german.data)."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "## Load data\n",
     "QI parameter determines which features will be minimized."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 2,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [
     {
      "name": "stdout",
@@ -108,9 +107,13 @@
     }
    ],
    "source": [
-    "from apt.utils import get_german_credit_dataset\n",
+    "import os\n",
+    "import sys\n",
+    "sys.path.insert(0, os.path.abspath('..'))\n",
     "\n",
-    "(x_train, y_train), (x_test, y_test) = get_german_credit_dataset()\n",
+    "from apt.utils.dataset_utils import get_german_credit_dataset_pd\n",
+    "\n",
+    "(x_train, y_train), (x_test, y_test) = get_german_credit_dataset_pd()\n",
     "features = [\"Existing_checking_account\", \"Duration_in_month\", \"Credit_history\", \"Purpose\", \"Credit_amount\",\n",
     "                \"Savings_account\", \"Present_employment_since\", \"Installment_rate\", \"Personal_status_sex\", \"debtors\",\n",
     "                \"Present_residence\", \"Property\", \"Age\", \"Other_installment_plans\", \"Housing\",\n",
@@ -123,33 +126,30 @@
     "      \"Housing\", \"Job\"]\n",
     "\n",
     "print(x_train)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "## Train decision tree model\n",
     "we use OneHotEncoder to handle categorical features."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 3,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Base model accuracy:  0.7033333333333334\n"
+      "Base model accuracy:  0.6933333333333334\n"
      ]
     }
    ],
@@ -176,50 +176,47 @@
     "\n",
     "encoded_test = preprocessor.transform(x_test)\n",
     "print('Base model accuracy: ', model.score(encoded_test, y_test))"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "## Run minimization\n",
     "We will try to run minimization with categorical features and only a subset of the features with different possible values of target accuracy (how close to the original model's accuracy we want to get, 1 being same accuracy as for original data)."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 4,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.791667\n",
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.805556\n",
       "Improving accuracy\n",
-      "feature to remove: Property\n",
-      "Removed feature: Property, new relative accuracy: 0.819444\n",
-      "feature to remove: Other_installment_plans\n",
-      "Removed feature: Other_installment_plans, new relative accuracy: 0.833333\n",
-      "feature to remove: Job\n",
-      "Removed feature: Job, new relative accuracy: 0.833333\n",
-      "feature to remove: Housing\n",
-      "Removed feature: Housing, new relative accuracy: 0.833333\n",
-      "feature to remove: Purpose\n",
-      "Removed feature: Purpose, new relative accuracy: 0.916667\n",
       "feature to remove: Credit_history\n",
-      "Removed feature: Credit_history, new relative accuracy: 0.930556\n",
-      "feature to remove: debtors\n",
-      "Removed feature: debtors, new relative accuracy: 0.944444\n",
+      "Removed feature: Credit_history, new relative accuracy: 0.819444\n",
+      "feature to remove: Other_installment_plans\n",
+      "Removed feature: Other_installment_plans, new relative accuracy: 0.847222\n",
       "feature to remove: Duration_in_month\n",
-      "Removed feature: Duration_in_month, new relative accuracy: 1.000000\n",
+      "Removed feature: Duration_in_month, new relative accuracy: 0.847222\n",
+      "feature to remove: Property\n",
+      "Removed feature: Property, new relative accuracy: 0.847222\n",
+      "feature to remove: Housing\n",
+      "Removed feature: Housing, new relative accuracy: 0.847222\n",
+      "feature to remove: Purpose\n",
+      "Removed feature: Purpose, new relative accuracy: 0.986111\n",
+      "feature to remove: debtors\n",
+      "Removed feature: debtors, new relative accuracy: 0.986111\n",
+      "feature to remove: Job\n",
+      "Removed feature: Job, new relative accuracy: 1.000000\n",
       "Accuracy on minimized data:  0.6666666666666666\n"
      ]
     }
@@ -233,7 +230,7 @@
     "from sklearn.model_selection import train_test_split\n",
     "\n",
     "# default target_accuracy is 0.998\n",
-    "minimizer = GeneralizeToRepresentative(model, features=features,\n",
+    "minimizer = GeneralizeToRepresentative(model, \n",
     "                                     categorical_features=categorical_features, features_to_minimize=QI)\n",
     "\n",
     "# Fitting the minimizar can be done either on training or test data. Doing it with test data is better as the\n",
@@ -248,117 +245,103 @@
     "y_test.reset_index(drop=True, inplace=True)\n",
     "encoded_generalizer_train = preprocessor.transform(X_generalizer_train)\n",
     "x_train_predictions = model.predict(encoded_generalizer_train)\n",
-    "minimizer.fit(X_generalizer_train, x_train_predictions)\n",
-    "transformed = minimizer.transform(x_test)\n",
+    "minimizer.fit(X_generalizer_train, x_train_predictions, features_names=features)\n",
+    "transformed = minimizer.transform(x_test, features_names=features)\n",
     "\n",
     "encoded_transformed = preprocessor.transform(transformed)\n",
     "print('Accuracy on minimized data: ', model.score(encoded_transformed, y_test))"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "#### Let's see what features were generalized"
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 5,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "{'ranges': {}, 'categories': {}, 'untouched': ['Purpose', 'Present_residence', 'Credit_history', 'Telephone', 'Job', 'Housing', 'Installment_rate', 'Number_of_existing_credits', 'Foreign_worker', 'Existing_checking_account', 'Other_installment_plans', 'N_people_being_liable_provide_maintenance', 'Property', 'Savings_account', 'Present_employment_since', 'Personal_status_sex', 'Duration_in_month', 'debtors', 'Credit_amount', 'Age']}\n"
+      "{'ranges': {}, 'categories': {}, 'untouched': ['Foreign_worker', 'Other_installment_plans', 'Existing_checking_account', 'Purpose', 'debtors', 'Housing', 'N_people_being_liable_provide_maintenance', 'Present_employment_since', 'Installment_rate', 'Credit_history', 'Property', 'Present_residence', 'Age', 'Credit_amount', 'Duration_in_month', 'Job', 'Personal_status_sex', 'Number_of_existing_credits', 'Savings_account', 'Telephone']}\n"
      ]
     }
    ],
    "source": [
     "generalizations = minimizer.generalizations\n",
     "print(generalizations)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
     "We can see that for the default target accuracy of 0.998 of the original accuracy, no generalizations are possible (all features are left untouched, i.e., not generalized).\n",
     "\n",
     "Let's change to a slightly lower target accuracy."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+   ]
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 6,
+   "metadata": {
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.791667\n",
+      "Initial accuracy of model on generalized data, relative to original model predictions (base generalization derived from tree, before improvements): 0.805556\n",
       "Improving accuracy\n",
-      "feature to remove: Property\n",
-      "Removed feature: Property, new relative accuracy: 0.819444\n",
-      "feature to remove: Other_installment_plans\n",
-      "Removed feature: Other_installment_plans, new relative accuracy: 0.833333\n",
-      "feature to remove: Job\n",
-      "Removed feature: Job, new relative accuracy: 0.833333\n",
-      "feature to remove: Housing\n",
-      "Removed feature: Housing, new relative accuracy: 0.833333\n",
-      "feature to remove: Purpose\n",
-      "Removed feature: Purpose, new relative accuracy: 0.916667\n",
       "feature to remove: Credit_history\n",
-      "Removed feature: Credit_history, new relative accuracy: 0.930556\n",
-      "Accuracy on minimized data:  0.6416666666666667\n",
-      "{'ranges': {'Duration_in_month': [7.0, 8.5, 11.0, 13.0, 14.0, 18.0, 23.0, 25.5, 34.5, 47.5]}, 'categories': {'debtors': [['A101', 'A102'], ['A103']]}, 'untouched': ['Existing_checking_account', 'Savings_account', 'Present_employment_since', 'Property', 'Housing', 'Purpose', 'Personal_status_sex', 'Present_residence', 'Credit_history', 'Telephone', 'Installment_rate', 'Other_installment_plans', 'Number_of_existing_credits', 'Credit_amount', 'N_people_being_liable_provide_maintenance', 'Foreign_worker', 'Age', 'Job']}\n"
+      "Removed feature: Credit_history, new relative accuracy: 0.819444\n",
+      "feature to remove: Other_installment_plans\n",
+      "Removed feature: Other_installment_plans, new relative accuracy: 0.847222\n",
+      "feature to remove: Duration_in_month\n",
+      "Removed feature: Duration_in_month, new relative accuracy: 0.847222\n",
+      "feature to remove: Property\n",
+      "Removed feature: Property, new relative accuracy: 0.847222\n",
+      "feature to remove: Housing\n",
+      "Removed feature: Housing, new relative accuracy: 0.847222\n",
+      "feature to remove: Purpose\n",
+      "Removed feature: Purpose, new relative accuracy: 0.986111\n",
+      "Accuracy on minimized data:  0.6666666666666666\n",
+      "{'ranges': {}, 'categories': {'debtors': [['A103', 'A102'], ['A101']], 'Job': [['A173', 'A174'], ['A171'], ['A172']]}, 'untouched': ['Credit_amount', 'Duration_in_month', 'Credit_history', 'Foreign_worker', 'Housing', 'Other_installment_plans', 'Property', 'N_people_being_liable_provide_maintenance', 'Present_residence', 'Personal_status_sex', 'Telephone', 'Number_of_existing_credits', 'Present_employment_since', 'Existing_checking_account', 'Savings_account', 'Age', 'Purpose', 'Installment_rate']}\n"
      ]
     }
    ],
    "source": [
     "# We allow a 1% deviation in accuracy from the original model accuracy\n",
-    "minimizer2 = GeneralizeToRepresentative(model, target_accuracy=0.92, features=features,\n",
+    "minimizer2 = GeneralizeToRepresentative(model, target_accuracy=0.92, \n",
     "                                     categorical_features=categorical_features, features_to_minimize=QI)\n",
     "\n",
-    "minimizer2.fit(X_generalizer_train, x_train_predictions)\n",
-    "transformed2 = minimizer2.transform(x_test)\n",
+    "minimizer2.fit(X_generalizer_train, x_train_predictions, features_names=features)\n",
+    "transformed2 = minimizer2.transform(x_test, features_names=features)\n",
     "\n",
     "encoded_transformed2 = preprocessor.transform(transformed2)\n",
     "print('Accuracy on minimized data: ', model.score(encoded_transformed2, y_test))\n",
     "generalizations2 = minimizer2.generalizations\n",
     "print(generalizations2)"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
-    }
-   }
+   ]
   },
   {
    "cell_type": "markdown",
+   "metadata": {},
    "source": [
-    "This time we were able to generalize two features (Duration_in_month and debtors)."
-   ],
-   "metadata": {
-    "collapsed": false
-   }
+    "This time we were able to generalize two features (debtors and Job)."
+   ]
   }
  ],
  "metadata": {
@@ -370,16 +353,16 @@
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
-    "version": 2
+    "version": 3
    },
    "file_extension": ".py",
    "mimetype": "text/x-python",
    "name": "python",
    "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython2",
-   "version": "2.7.6"
+   "pygments_lexer": "ipython3",
+   "version": "3.8.3"
   }
  },
  "nbformat": 4,
- "nbformat_minor": 0
-}
\ No newline at end of file
+ "nbformat_minor": 1
+}
diff --git a/tests/test_anonymizer.py b/tests/test_anonymizer.py
index 358398c..12b6639 100644
--- a/tests/test_anonymizer.py
+++ b/tests/test_anonymizer.py
@@ -7,14 +7,14 @@ from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from sklearn.preprocessing import OneHotEncoder
 
 from apt.anonymization import Anonymize
-from apt.utils.dataset_utils import get_iris_dataset, get_adult_dataset, get_nursery_dataset
+from apt.utils.dataset_utils import get_iris_dataset_np, get_adult_dataset_pd, get_nursery_dataset_pd
 from sklearn.datasets import load_diabetes
 from sklearn.model_selection import train_test_split
-from apt.utils.datasets import ArrayDataset, DATA_PANDAS_NUMPY_TYPE
+from apt.utils.datasets import ArrayDataset
 
 
 def test_anonymize_ndarray_iris():
-    (x_train, y_train), _ = get_iris_dataset()
+    (x_train, y_train), _ = get_iris_dataset_np()
 
     model = DecisionTreeClassifier()
     model.fit(x_train, y_train)
@@ -31,11 +31,7 @@ def test_anonymize_ndarray_iris():
 
 
 def test_anonymize_pandas_adult():
-    (x_train, y_train), _ = get_adult_dataset()
-    encoded = OneHotEncoder().fit_transform(x_train)
-    model = DecisionTreeClassifier()
-    model.fit(encoded, y_train)
-    pred = model.predict(encoded)
+    (x_train, y_train), _ = get_adult_dataset_pd()
 
     k = 100
     features = ['age', 'workclass', 'education-num', 'marital-status', 'occupation', 'relationship', 'race', 'sex',
@@ -68,8 +64,9 @@ def test_anonymize_pandas_adult():
     assert (anon.loc[:, QI].value_counts().min() >= k)
     np.testing.assert_array_equal(anon.drop(QI, axis=1), x_train.drop(QI, axis=1))
 
+
 def test_anonymize_pandas_nursery():
-    (x_train, y_train), _ = get_nursery_dataset()
+    (x_train, y_train), _ = get_nursery_dataset_pd()
     x_train = x_train.astype(str)
 
     k = 100
@@ -102,7 +99,6 @@ def test_anonymize_pandas_nursery():
 
 
 def test_regression():
-
     dataset = load_diabetes()
     x_train, x_test, y_train, y_test = train_test_split(dataset.data, dataset.target, test_size=0.5, random_state=14)
 
@@ -130,9 +126,9 @@ def test_errors():
     with pytest.raises(ValueError):
         Anonymize(2, None)
     anonymizer = Anonymize(10, [0, 2])
-    (x_train, y_train), (x_test, y_test) = get_iris_dataset()
+    (x_train, y_train), (x_test, y_test) = get_iris_dataset_np()
     with pytest.raises(ValueError):
         anonymizer.anonymize(dataset=ArrayDataset(x_train, y_test))
-    (x_train, y_train), _ = get_adult_dataset()
+    (x_train, y_train), _ = get_adult_dataset_pd()
     with pytest.raises(ValueError):
         anonymizer.anonymize(dataset=ArrayDataset(x_train, y_test))
diff --git a/tests/test_minimizer.py b/tests/test_minimizer.py
index 630cd49..181755b 100644
--- a/tests/test_minimizer.py
+++ b/tests/test_minimizer.py
@@ -9,11 +9,14 @@ from sklearn.model_selection import train_test_split
 from sklearn.pipeline import Pipeline
 from sklearn.preprocessing import OneHotEncoder
 
+from tensorflow.keras.models import Sequential
+from tensorflow.keras.layers import Dense, Input
+
 from apt.minimization import GeneralizeToRepresentative
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
-from apt.utils.dataset_utils import get_iris_dataset, get_adult_dataset, get_nursery_dataset, get_german_credit_dataset
-from apt.utils.datasets import ArrayDataset
-from apt.utils.models import SklearnClassifier, ModelOutputType, SklearnRegressor
+from apt.utils.dataset_utils import get_iris_dataset_np, get_adult_dataset_pd, get_german_credit_dataset_pd
+from apt.utils.datasets import ArrayDataset, Data
+from apt.utils.models import SklearnClassifier, ModelOutputType, SklearnRegressor, KerasClassifier, BlackboxClassifier
 
 
 @pytest.fixture
@@ -39,7 +42,7 @@ def test_minimizer_params(data):
     y = [1, 1, 0]
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(X, y))
 
     gen = GeneralizeToRepresentative(model, cells=cells)
@@ -63,9 +66,10 @@ def test_minimizer_fit(data):
     y = np.array([1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0])
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(X, y))
-    predictions = model.predict(X)
+    ad = ArrayDataset(X)
+    predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
@@ -73,26 +77,26 @@ def test_minimizer_fit(data):
     train_dataset = ArrayDataset(X, predictions, features_names=features)
 
     gen.fit(dataset=train_dataset)
-    transformed = gen.transform(dataset=ArrayDataset(X))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {}, 'categories': {}, 'untouched': ['height', 'age']}
+    transformed = gen.transform(dataset=ad)
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {}, 'categories': {}, 'untouched': ['height', 'age']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     indexes = []
     for i in range(len(features)):
         if features[i] in modified_features:
             indexes.append(i)
     assert ((np.delete(transformed, indexes, axis=1) == np.delete(X, indexes, axis=1)).all())
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
@@ -131,9 +135,9 @@ def test_minimizer_fit_pandas(data):
     encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(encoded, y))
-    predictions = model.predict(encoded)
+    predictions = model.predict(ArrayDataset(encoded))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
@@ -144,21 +148,22 @@ def test_minimizer_fit_pandas(data):
     train_dataset = ArrayDataset(X, predictions)
     gen.fit(dataset=train_dataset)
     transformed = gen.transform(dataset=ArrayDataset(X))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'age': []}, 'categories': {}, 'untouched': ['ola', 'height', 'sex']}
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'age': []}, 'categories': {'sex': [['f', 'm']], 'ola': [['aa', 'bb']]},
+                                'untouched': ['height']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), X.drop(modified_features, axis=1))
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(X[modified_features])) == False)
 
@@ -212,9 +217,9 @@ def test_minimizer_params_categorical(data):
     encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(encoded, y))
-    predictions = model.predict(encoded)
+    predictions = model.predict(ArrayDataset(encoded))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
     # Append classifier to preprocessing pipeline.
@@ -244,35 +249,36 @@ def test_minimizer_fit_QI(data):
     QI = ['age', 'weight']
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(X, y))
-    predictions = model.predict(X)
+    ad = ArrayDataset(X)
+    predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
     gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
     train_dataset = ArrayDataset(X, predictions, features_names=features)
     gen.fit(dataset=train_dataset)
-    transformed = gen.transform(dataset=ArrayDataset(X))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'age': [], 'weight': [67.5]}, 'categories': {}, 'untouched': ['height']}
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    transformed = gen.transform(dataset=ad)
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'age': [], 'weight': [67.5]}, 'categories': {}, 'untouched': ['height']}
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     assert ((np.delete(transformed, [0, 2], axis=1) == np.delete(X, [0, 2], axis=1)).all())
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     indexes = []
     for i in range(len(features)):
         if features[i] in modified_features:
             indexes.append(i)
     assert ((np.delete(transformed, indexes, axis=1) == np.delete(X, indexes, axis=1)).all())
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
@@ -313,9 +319,9 @@ def test_minimizer_fit_pandas_QI(data):
     encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(encoded, y))
-    predictions = model.predict(encoded)
+    predictions = model.predict(ArrayDataset(encoded))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
@@ -326,72 +332,72 @@ def test_minimizer_fit_pandas_QI(data):
     train_dataset = ArrayDataset(X, predictions)
     gen.fit(dataset=train_dataset)
     transformed = gen.transform(dataset=ArrayDataset(X))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'age': [], 'weight': [47.0]}, 'categories': {'ola': [['bb', 'aa']]},
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'age': [], 'weight': [47.0]}, 'categories': {'ola': [['bb', 'aa']]},
                                 'untouched': ['height', 'sex']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     # assert (transformed.drop(QI, axis=1).equals(X.drop(QI, axis=1)))
     np.testing.assert_array_equal(transformed.drop(QI, axis=1), X.drop(QI, axis=1))
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     # assert (transformed.drop(modified_features, axis=1).equals(X.drop(modified_features, axis=1)))
     np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), X.drop(modified_features, axis=1))
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(X[modified_features])) == False)
 
 
 def test_minimize_ndarray_iris():
     features = ['sepal length (cm)', 'sepal width (cm)', 'petal length (cm)', 'petal width (cm)']
-    (x_train, y_train), (x_test, y_test) = get_iris_dataset()
+    (x_train, y_train), (x_test, y_test) = get_iris_dataset_np()
     QI = ['sepal length (cm)', 'petal length (cm)']
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(x_train, y_train))
-    predictions = model.predict(x_train)
+    predictions = model.predict(ArrayDataset(x_train))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
     gen = GeneralizeToRepresentative(model, target_accuracy=0.3, features_to_minimize=QI)
     # gen.fit(dataset=ArrayDataset(x_train, predictions))
     transformed = gen.fit_transform(dataset=ArrayDataset(x_train, predictions, features_names=features))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'sepal length (cm)': [], 'petal length (cm)': [2.449999988079071]},
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'sepal length (cm)': [], 'petal length (cm)': [2.449999988079071]},
                                 'categories': {}, 'untouched': ['petal width (cm)', 'sepal width (cm)']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     assert ((np.delete(transformed, [0, 2], axis=1) == np.delete(x_train, [0, 2], axis=1)).all())
 
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     indexes = []
     for i in range(len(features)):
         if features[i] in modified_features:
             indexes.append(i)
     assert ((np.delete(transformed, indexes, axis=1) == np.delete(x_train, indexes, axis=1)).all())
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[indexes]) != (x_train[indexes])).any())
 
 
 def test_minimize_pandas_adult():
-    (x_train, y_train), (x_test, y_test) = get_adult_dataset()
+    (x_train, y_train), (x_test, y_test) = get_adult_dataset_pd()
     x_train = x_train.head(1000)
     y_train = y_train.head(1000)
 
@@ -420,9 +426,9 @@ def test_minimize_pandas_adult():
     encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(encoded, y_train))
-    predictions = model.predict(encoded)
+    predictions = model.predict(ArrayDataset(encoded))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
@@ -430,8 +436,8 @@ def test_minimize_pandas_adult():
                                      categorical_features=categorical_features, features_to_minimize=QI)
     gen.fit(dataset=ArrayDataset(x_train, predictions, features_names=features))
     transformed = gen.transform(dataset=ArrayDataset(x_train))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'age': [], 'education-num': []}, 'categories': {
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'age': [], 'education-num': []}, 'categories': {
         'workclass': [['Self-emp-not-inc', 'Private', 'Federal-gov', 'Self-emp-inc', '?', 'Local-gov', 'State-gov']],
         'marital-status': [
             ['Divorced', 'Married-AF-spouse', 'Married-spouse-absent', 'Widowed', 'Separated', 'Married-civ-spouse',
@@ -445,28 +451,28 @@ def test_minimize_pandas_adult():
             ['Euro_1', 'LatinAmerica', 'BritishCommonwealth', 'SouthAmerica', 'UnitedStates', 'China', 'Euro_2',
              'SE_Asia', 'Other', 'Unknown']]}, 'untouched': ['capital-loss', 'hours-per-week', 'capital-gain']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     # assert (transformed.drop(QI, axis=1).equals(x_train.drop(QI, axis=1)))
     np.testing.assert_array_equal(transformed.drop(QI, axis=1), x_train.drop(QI, axis=1))
 
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     # assert (transformed.drop(modified_features, axis=1).equals(x_train.drop(modified_features, axis=1)))
     np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), x_train.drop(modified_features, axis=1))
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(x_train[modified_features])) == False)
 
 
 def test_german_credit_pandas():
-    (x_train, y_train), (x_test, y_test) = get_german_credit_dataset()
+    (x_train, y_train), (x_test, y_test) = get_german_credit_dataset_pd()
     features = ["Existing_checking_account", "Duration_in_month", "Credit_history", "Purpose", "Credit_amount",
                 "Savings_account", "Present_employment_since", "Installment_rate", "Personal_status_sex", "debtors",
                 "Present_residence", "Property", "Age", "Other_installment_plans", "Housing",
@@ -493,9 +499,9 @@ def test_german_credit_pandas():
     encoded = pd.DataFrame(encoded)
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(encoded, y_train))
-    predictions = model.predict(encoded)
+    predictions = model.predict(ArrayDataset(encoded))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
@@ -503,8 +509,8 @@ def test_german_credit_pandas():
                                      categorical_features=categorical_features, features_to_minimize=QI)
     gen.fit(dataset=ArrayDataset(x_train, predictions))
     transformed = gen.transform(dataset=ArrayDataset(x_train))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'Duration_in_month': [31.5]},
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'Duration_in_month': [31.5]},
                                 'categories': {'Credit_history': [['A30', 'A32', 'A31', 'A34', 'A33']], 'Purpose': [
                                     ['A41', 'A46', 'A43', 'A40', 'A44', 'A410', 'A49', 'A45', 'A48', 'A42']],
                                                'debtors': [['A101', 'A102', 'A103']],
@@ -518,22 +524,22 @@ def test_german_credit_pandas():
                                               'Age', 'Existing_checking_account', 'Credit_amount',
                                               'Present_employment_since']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     # assert (transformed.drop(QI, axis=1).equals(x_train.drop(QI, axis=1)))
     np.testing.assert_array_equal(transformed.drop(QI, axis=1), x_train.drop(QI, axis=1))
 
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     # assert (transformed.drop(modified_features, axis=1).equals(x_train.drop(modified_features, axis=1)))
     np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), x_train.drop(modified_features, axis=1))
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(x_train[modified_features])) == False)
 
@@ -545,7 +551,7 @@ def test_regression():
     base_est = DecisionTreeRegressor(random_state=10, min_samples_split=2)
     model = SklearnRegressor(base_est)
     model.fit(ArrayDataset(x_train, y_train))
-    predictions = model.predict(x_train)
+    predictions = model.predict(ArrayDataset(x_train))
     QI = ['age', 'bmi', 's2', 's5']
     features = ['age', 'sex', 'bmi', 'bp',
                 's1', 's2', 's3', 's4', 's5', 's6']
@@ -557,8 +563,8 @@ def test_regression():
     print('Base model accuracy (R2 score): ', model.score(ArrayDataset(x_test, y_test)))
     model.fit(ArrayDataset(transformed, y_train))
     print('Base model accuracy (R2 score) after anonymization: ', model.score(ArrayDataset(x_test, y_test)))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {
         'age': [-0.07816532626748085, -0.07090024650096893, -0.05637009255588055, -0.05092128552496433,
                 -0.04728874587453902, -0.04547247663140297, -0.04183994047343731, -0.027309784665703773,
                 -0.023677248042076826, -0.020044708624482155, -0.01641217083670199, -0.001882016600575298,
@@ -586,24 +592,24 @@ def test_regression():
                0.061315815430134535, 0.06272498145699501, 0.06460387445986271]}, 'categories': {},
         'untouched': ['s5', 's3', 'bp', 's1', 'sex', 's6', 's4']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     assert ((np.delete(transformed, [0, 2, 5, 8], axis=1) == np.delete(x_train, [0, 2, 5, 8], axis=1)).all())
 
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     indexes = []
     for i in range(len(features)):
         if features[i] in modified_features:
             indexes.append(i)
     assert ((np.delete(transformed, indexes, axis=1) == np.delete(x_train, indexes, axis=1)).all())
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[indexes]) != (x_train[indexes])).any())
 
@@ -626,34 +632,35 @@ def test_X_y(data):
     QI = [0, 2]
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(X, y))
-    predictions = model.predict(X)
+    ad = ArrayDataset(X)
+    predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
     gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
     gen.fit(X=X, y=predictions)
     transformed = gen.transform(X)
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'0': [], '2': [67.5]}, 'categories': {}, 'untouched': ['1']}
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'0': [], '2': [67.5]}, 'categories': {}, 'untouched': ['1']}
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     assert ((np.delete(transformed, [0, 2], axis=1) == np.delete(X, [0, 2], axis=1)).all())
     modified_features = [f for f in features if
-                         str(f) in expexted_generalizations['categories'].keys() or str(f) in expexted_generalizations[
+                         str(f) in expected_generalizations['categories'].keys() or str(f) in expected_generalizations[
                              'ranges'].keys()]
     indexes = []
     for i in range(len(features)):
         if features[i] in modified_features:
             indexes.append(i)
     assert ((np.delete(transformed, indexes, axis=1) == np.delete(X, indexes, axis=1)).all())
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
@@ -676,34 +683,35 @@ def test_X_y_features_names(data):
     QI = ['age', 'weight']
     base_est = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                       min_samples_leaf=1)
-    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
     model.fit(ArrayDataset(X, y))
-    predictions = model.predict(X)
+    ad = ArrayDataset(X)
+    predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
 
     gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
     gen.fit(X=X, y=predictions, features_names=features)
     transformed = gen.transform(X=X, features_names=features)
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'age': [], 'weight': [67.5]}, 'categories': {}, 'untouched': ['height']}
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'age': [], 'weight': [67.5]}, 'categories': {}, 'untouched': ['height']}
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     assert ((np.delete(transformed, [0, 2], axis=1) == np.delete(X, [0, 2], axis=1)).all())
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     indexes = []
     for i in range(len(features)):
         if features[i] in modified_features:
             indexes.append(i)
     assert ((np.delete(transformed, indexes, axis=1) == np.delete(X, indexes, axis=1)).all())
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
@@ -755,25 +763,25 @@ def test_BaseEstimator_classification(data):
     train_dataset = ArrayDataset(X, predictions)
     gen.fit(dataset=train_dataset)
     transformed = gen.transform(dataset=ArrayDataset(X))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {'age': [], 'weight': [47.0]}, 'categories': {'ola': [['bb', 'aa']]},
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'age': [], 'weight': [47.0]}, 'categories': {'ola': [['bb', 'aa']]},
                                 'untouched': ['height', 'sex']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     # assert (transformed.drop(QI, axis=1).equals(X.drop(QI, axis=1)))
     np.testing.assert_array_equal(transformed.drop(QI, axis=1), X.drop(QI, axis=1))
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     # assert (transformed.drop(modified_features, axis=1).equals(X.drop(modified_features, axis=1)))
     np.testing.assert_array_equal(transformed.drop(modified_features, axis=1), X.drop(modified_features, axis=1))
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(X[modified_features])) == False)
 
@@ -797,8 +805,8 @@ def test_BaseEstimator_regression():
     print('Base model accuracy (R2 score): ', model.score(x_test, y_test))
     model.fit(transformed, y_train)
     print('Base model accuracy (R2 score) after minimization: ', model.score(x_test, y_test))
-    gener = gen.generalizations_
-    expexted_generalizations = {'ranges': {
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {
         'age': [-0.07816532626748085, -0.07090024650096893, -0.05637009255588055, -0.05092128552496433,
                 -0.04728874587453902, -0.04547247663140297, -0.04183994047343731, -0.027309784665703773,
                 -0.023677248042076826, -0.020044708624482155, -0.01641217083670199, -0.001882016600575298,
@@ -826,23 +834,106 @@ def test_BaseEstimator_regression():
                0.061315815430134535, 0.06272498145699501, 0.06460387445986271]}, 'categories': {},
         'untouched': ['s5', 's3', 'bp', 's1', 'sex', 's6', 's4']}
 
-    for key in expexted_generalizations['ranges']:
-        assert (set(expexted_generalizations['ranges'][key]) == set(gener['ranges'][key]))
-    for key in expexted_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expexted_generalizations['categories'][key]]) ==
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expexted_generalizations['untouched']) == set(gener['untouched']))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
     assert ((np.delete(transformed, [0, 2, 5, 8], axis=1) == np.delete(x_train, [0, 2, 5, 8], axis=1)).all())
 
     modified_features = [f for f in features if
-                         f in expexted_generalizations['categories'].keys() or f in expexted_generalizations[
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
                              'ranges'].keys()]
     indexes = []
     for i in range(len(features)):
         if features[i] in modified_features:
             indexes.append(i)
     assert ((np.delete(transformed, indexes, axis=1) == np.delete(x_train, indexes, axis=1)).all())
-    ncp = gen.ncp_
-    if len(expexted_generalizations['ranges'].keys()) > 0 or len(expexted_generalizations['categories'].keys()) > 0:
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[indexes]) != (x_train[indexes])).any())
+
+
+def test_keras_model():
+    (X, y), (x_test, y_test) = get_iris_dataset_np()
+
+    base_est = Sequential()
+    base_est.add(Input(shape=(4,)))
+    base_est.add(Dense(10, activation="relu"))
+    base_est.add(Dense(3, activation='softmax'))
+
+    base_est.compile(loss="categorical_crossentropy", optimizer="adam", metrics=["accuracy"])
+
+    model = KerasClassifier(base_est, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model.fit(ArrayDataset(X, y))
+    ad = ArrayDataset(x_test)
+    predictions = model.predict(ad)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
+
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5)
+    test_dataset = ArrayDataset(x_test, predictions)
+
+    gen.fit(dataset=test_dataset)
+    transformed = gen.transform(dataset=ad)
+    gener = gen.generalizations
+
+    features = ['0', '1', '2', '3']
+    modified_features = [f for f in features if
+                         f in gener['categories'].keys() or f in gener['ranges'].keys()]
+    indexes = []
+    for i in range(len(features)):
+        if features[i] in modified_features:
+            indexes.append(i)
+    assert ((np.delete(transformed, indexes, axis=1) == np.delete(x_test, indexes, axis=1)).all())
+    ncp = gen.ncp
+    if len(gener['ranges'].keys()) > 0 or len(gener['categories'].keys()) > 0:
+        assert (ncp > 0)
+        assert (((transformed[indexes]) != (X[indexes])).any())
+
+
+def test_blackbox_model():
+    (X, y), (x_test, y_test) = get_iris_dataset_np()
+    train_data = ArrayDataset(X, y)
+    test_data = ArrayDataset(x_test, y_test)
+    data = Data(train_data, test_data)
+
+    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    ad = ArrayDataset(x_test)
+    predictions = model.predict(ad)
+    if predictions.shape[1] > 1:
+        predictions = np.argmax(predictions, axis=1)
+
+    gen = GeneralizeToRepresentative(model, target_accuracy=0.5)
+    train_dataset = ArrayDataset(x_test, predictions)
+
+    gen.fit(dataset=train_dataset)
+    transformed = gen.transform(dataset=ad)
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'0': [], '1': [], '2': [4.849999904632568, 5.049999952316284],
+                                           '3': [0.7000000029802322, 1.600000023841858]},
+                                'categories': {},
+                                'untouched': []}
+
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
+                set([frozenset(sl) for sl in gener['categories'][key]]))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
+
+    features = ['0', '1', '2', '3']
+    modified_features = [f for f in features if
+                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
+                             'ranges'].keys()]
+    indexes = []
+    for i in range(len(features)):
+        if features[i] in modified_features:
+            indexes.append(i)
+    assert ((np.delete(transformed, indexes, axis=1) == np.delete(x_test, indexes, axis=1)).all())
+    ncp = gen.ncp
+    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
+        assert (ncp > 0)
+        assert (((transformed[indexes]) != (X[indexes])).any())
diff --git a/tests/test_model.py b/tests/test_model.py
index bbb951b..4470658 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -1,21 +1,24 @@
 import pytest
 
-from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType
-from apt.utils.datasets import ArrayDataset
+from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, BlackboxClassifier
+from apt.utils.datasets import ArrayDataset, Data
 from apt.utils import dataset_utils
 
 from sklearn.tree import DecisionTreeRegressor
 from sklearn.ensemble import RandomForestClassifier
 
+from tensorflow.keras.models import Sequential
+from tensorflow.keras.layers import Dense, Input
+
 
 def test_sklearn_classifier():
-    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset()
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
     underlying_model = RandomForestClassifier()
-    model = SklearnClassifier(underlying_model, ModelOutputType.CLASSIFIER_VECTOR)
+    model = SklearnClassifier(underlying_model, ModelOutputType.CLASSIFIER_PROBABILITIES)
     train = ArrayDataset(x_train, y_train)
     test = ArrayDataset(x_test, y_test)
     model.fit(train)
-    pred = model.predict(x_test)
+    pred = model.predict(test)
     assert(pred.shape[0] == x_test.shape[0])
 
     score = model.score(test)
@@ -23,13 +26,50 @@ def test_sklearn_classifier():
 
 
 def test_sklearn_regressor():
-    (x_train, y_train), (x_test, y_test) = dataset_utils.get_diabetes_dataset()
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_diabetes_dataset_np()
     underlying_model = DecisionTreeRegressor()
     model = SklearnRegressor(underlying_model)
     train = ArrayDataset(x_train, y_train)
     test = ArrayDataset(x_test, y_test)
     model.fit(train)
-    pred = model.predict(x_test)
+    pred = model.predict(test)
     assert (pred.shape[0] == x_test.shape[0])
 
     score = model.score(test)
+
+
+def test_keras_classifier():
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
+
+    underlying_model = Sequential()
+    underlying_model.add(Input(shape=(4,)))
+    underlying_model.add(Dense(100, activation="relu"))
+    underlying_model.add(Dense(10, activation="relu"))
+    underlying_model.add(Dense(3, activation='softmax'))
+
+    underlying_model.compile(loss="categorical_crossentropy", optimizer="adam", metrics=["accuracy"])
+
+    model = KerasClassifier(underlying_model, ModelOutputType.CLASSIFIER_PROBABILITIES)
+
+    train = ArrayDataset(x_train, y_train)
+    test = ArrayDataset(x_test, y_test)
+    model.fit(train)
+    pred = model.predict(test)
+    assert(pred.shape[0] == x_test.shape[0])
+
+    score = model.score(test)
+    assert(0.0 <= score <= 1.0)
+
+
+def test_blackbox_classifier():
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
+
+    train = ArrayDataset(x_train, y_train)
+    test = ArrayDataset(x_test, y_test)
+    data = Data(train, test)
+    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    pred = model.predict(test)
+    assert(pred.shape[0] == x_test.shape[0])
+
+    score = model.score(test)
+    assert(0.0 <= score <= 1.0)

From 186f11eaaf9238dfaa469c128d3e33fe4133f7f2 Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Thu, 19 May 2022 16:41:31 +0300
Subject: [PATCH 10/26] Fix misclassification of categorical features with no
 generalizations (now appear under the 'untouched' category)

---
 apt/minimization/minimizer.py | 21 ++++++++++++++++++---
 tests/test_minimizer.py       | 22 ++++++++++++++++++++++
 2 files changed, 40 insertions(+), 3 deletions(-)

diff --git a/apt/minimization/minimizer.py b/apt/minimization/minimizer.py
index df70a3a..ebac318 100644
--- a/apt/minimization/minimizer.py
+++ b/apt/minimization/minimizer.py
@@ -62,9 +62,9 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                  cells: Optional[list] = None, categorical_features: Optional[Union[np.ndarray, list]] = None,
                  features_to_minimize: Optional[Union[np.ndarray, list]] = None, train_only_QI: Optional[bool] = True,
                  is_regression: Optional[bool] = False):
-        if issubclass(estimator.__class__, Model):
-            self.estimator = estimator
-        else:
+
+        self.estimator = estimator
+        if estimator is not None and not issubclass(estimator.__class__, Model):
             if is_regression:
                 self.estimator = SklearnRegressor(estimator)
             else:
@@ -832,6 +832,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         self._generalizations = {'ranges': GeneralizeToRepresentative._calculate_ranges(self.cells),
                                  'categories': GeneralizeToRepresentative._calculate_categories(self.cells),
                                  'untouched': GeneralizeToRepresentative._calculate_untouched(self.cells)}
+        self._remove_categorical_untouched(self._generalizations)
 
     def _find_range_count(self, samples, ranges):
         samples_df = pd.DataFrame(samples, columns=self._categorical_data.columns)
@@ -988,3 +989,17 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 del cell['categories'][feature]
             cell['untouched'].append(feature)
             cells_by_id[cell['id']] = cell.copy()
+
+    @staticmethod
+    def _remove_categorical_untouched(generalizations):
+        to_remove = []
+        for feature in generalizations['categories'].keys():
+            category_sizes = [len(g) if len(g) > 1 else 0 for g in generalizations['categories'][feature]]
+            if sum(category_sizes) == 0:
+                if 'untouched' not in generalizations:
+                    generalizations['untouched'] = []
+                generalizations['untouched'].append(feature)
+                to_remove.append(feature)
+
+        for feature in to_remove:
+            del generalizations['categories'][feature]
diff --git a/tests/test_minimizer.py b/tests/test_minimizer.py
index 181755b..6adad90 100644
--- a/tests/test_minimizer.py
+++ b/tests/test_minimizer.py
@@ -937,3 +937,25 @@ def test_blackbox_model():
     if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
+
+
+def test_untouched():
+    cells = [{"id": 1, "ranges": {"age": {"start": None, "end": 38}}, "label": 0,
+              'categories': {'gender': ['male']}, "representative": {"age": 26, "height": 149}},
+             {"id": 2, "ranges": {"age": {"start": 39, "end": None}}, "label": 1,
+              'categories': {'gender': ['female']}, "representative": {"age": 58, "height": 163}},
+             {"id": 3, "ranges": {"age": {"start": None, "end": 38}}, "label": 0,
+              'categories': {'gender': ['male']}, "representative": {"age": 31, "height": 184}},
+             {"id": 4, "ranges": {"age": {"start": 39, "end": None}}, "label": 1,
+              'categories': {'gender': ['male', 'female']}, "representative": {"age": 45, "height": 176}}
+             ]
+    gen = GeneralizeToRepresentative(cells=cells)
+    gen._calculate_generalizations()
+    gener = gen.generalizations
+    expected_generalizations = {'ranges': {'age': [38, 39]}, 'categories': {}, 'untouched': ['gender']}
+    for key in expected_generalizations['ranges']:
+        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+    for key in expected_generalizations['categories']:
+        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
+                set([frozenset(sl) for sl in gener['categories'][key]]))
+    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))

From 7055d5ecf6e89290a56ca3aa5eca307b45a6a783 Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Thu, 19 May 2022 17:49:59 +0300
Subject: [PATCH 11/26] Fix bug in pruning loop + fix test

---
 apt/minimization/minimizer.py | 47 +++++++++++++++++++----------------
 tests/test_minimizer.py       |  7 +++---
 2 files changed, 29 insertions(+), 25 deletions(-)

diff --git a/apt/minimization/minimizer.py b/apt/minimization/minimizer.py
index ebac318..c975fdb 100644
--- a/apt/minimization/minimizer.py
+++ b/apt/minimization/minimizer.py
@@ -324,31 +324,34 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 print('Improving generalizations')
                 level = 1
                 while accuracy > self.target_accuracy:
-                    try:
-                        cells_previous_iter = self.cells
-                        generalization_prev_iter = self._generalizations
-                        cells_by_id_prev = self._cells_by_id
-                        nodes = self._get_nodes_level(level)
-                        self._calculate_level_cells(level)
-                        self._attach_cells_representatives(x_prepared, used_X_train, y_train, nodes)
+                    cells_previous_iter = self.cells
+                    generalization_prev_iter = self._generalizations
+                    cells_by_id_prev = self._cells_by_id
+                    nodes = self._get_nodes_level(level)
 
-                        self._calculate_generalizations()
-                        generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells,
-                                                       self._cells_by_id)
-                        accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
-                        # if accuracy passed threshold roll back to previous iteration generalizations
-                        if accuracy < self.target_accuracy:
-                            self.cells = cells_previous_iter
-                            self._generalizations = generalization_prev_iter
-                            self._cells_by_id = cells_by_id_prev
-                            break
-                        else:
-                            print('Pruned tree to level: %d, new relative accuracy: %f' % (level, accuracy))
-                            level += 1
-                    except Exception as e:
+                    try:
+                        self._calculate_level_cells(level)
+                    except TypeError as e:
                         print(e)
                         break
 
+                    self._attach_cells_representatives(x_prepared, used_X_train, y_train, nodes)
+
+                    self._calculate_generalizations()
+                    generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells,
+                                                   self._cells_by_id)
+                    accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
+                    # if accuracy passed threshold roll back to previous iteration generalizations
+                    if accuracy < self.target_accuracy:
+                        self.cells = cells_previous_iter
+                        self._generalizations = generalization_prev_iter
+                        self._cells_by_id = cells_by_id_prev
+                        break
+                    else:
+                        print('Pruned tree to level: %d, new relative accuracy: %f' % (level, accuracy))
+                        level += 1
+
+
             # if accuracy below threshold, improve accuracy by removing features from generalization
             elif accuracy < self.target_accuracy:
                 print('Improving accuracy')
@@ -569,7 +572,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         features = self._categorical_data.columns
         for cell in self.cells:
             new_cell = {'id': cell['id'], 'label': cell['label'], 'ranges': {}, 'categories': {}, 'hist': cell['hist'],
-                        'representative': None}
+                        'untouched': [], 'representative': None}
             for feature in features:
                 if feature in self._one_hot_vector_features_to_features.keys():
                     # feature is categorical and should be mapped
diff --git a/tests/test_minimizer.py b/tests/test_minimizer.py
index 6adad90..dca3ebd 100644
--- a/tests/test_minimizer.py
+++ b/tests/test_minimizer.py
@@ -1,6 +1,8 @@
 import pytest
 import numpy as np
 import pandas as pd
+from numpy.testing import assert_almost_equal
+
 from sklearn.compose import ColumnTransformer
 
 from sklearn.datasets import load_boston, load_diabetes
@@ -912,13 +914,12 @@ def test_blackbox_model():
     gen.fit(dataset=train_dataset)
     transformed = gen.transform(dataset=ad)
     gener = gen.generalizations
-    expected_generalizations = {'ranges': {'0': [], '1': [], '2': [4.849999904632568, 5.049999952316284],
-                                           '3': [0.7000000029802322, 1.600000023841858]},
+    expected_generalizations = {'ranges': {'0': [], '1': [], '2': [4.849999904632568], '3': [0.7000000029802322]},
                                 'categories': {},
                                 'untouched': []}
 
     for key in expected_generalizations['ranges']:
-        assert (set(expected_generalizations['ranges'][key]) == set(gener['ranges'][key]))
+        assert_almost_equal(expected_generalizations['ranges'][key], gener['ranges'][key])
     for key in expected_generalizations['categories']:
         assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
                 set([frozenset(sl) for sl in gener['categories'][key]]))

From dfa684da6bec83d87d31cc58f162d3d0915664ba Mon Sep 17 00:00:00 2001
From: abigailgold <57357634+abigailgold@users.noreply.github.com>
Date: Sun, 22 May 2022 18:02:33 +0300
Subject: [PATCH 12/26] Consistent one-hot-encoding (#38)

* Reuse code between generalize and transform methods

* Option to get encoder from user

* Consistent encoding for decision tree and generalizations (separate from target model encoding)
---
 apt/minimization/minimizer.py | 181 +++++++++++++++-------------------
 tests/test_minimizer.py       | 100 ++++++++++++++-----
 2 files changed, 153 insertions(+), 128 deletions(-)

diff --git a/apt/minimization/minimizer.py b/apt/minimization/minimizer.py
index c975fdb..79983f7 100644
--- a/apt/minimization/minimizer.py
+++ b/apt/minimization/minimizer.py
@@ -11,7 +11,7 @@ from sklearn.base import BaseEstimator, TransformerMixin, MetaEstimatorMixin
 from sklearn.compose import ColumnTransformer
 from sklearn.impute import SimpleImputer
 from sklearn.pipeline import Pipeline
-from sklearn.preprocessing import OneHotEncoder
+from sklearn.preprocessing import OneHotEncoder, OrdinalEncoder
 from sklearn.utils.validation import check_is_fitted
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from sklearn.model_selection import train_test_split
@@ -47,12 +47,15 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
     :type cells: list of objects, optional
     :param categorical_features: The list of categorical features (if supplied, these featurtes will be one-hot
                                  encoded before using them to train the decision tree model).
+    :param encoder: Optional encoder for encoding data before feeding it into the estimator (e.g., for categorical
+                    features)
+    :type encoder: sklearn OrdinalEncoder or OneHotEncoder
     :type categorical_features: list of strings, optional
     :param features_to_minimize: The features to be minimized.
     :type features_to_minimize: list of strings or int, optional
-    :param train_only_QI: Whether to train the tree just on the ``features_to_minimize`` or on all features. Default
-                          is only on ``features_to_minimize``.
-    :type train_only_QI: boolean, optional
+    :param train_only_features_to_minimize: Whether to train the tree just on the ``features_to_minimize`` or on all
+                                            features. Default is only on ``features_to_minimize``.
+    :type train_only_features_to_minimize: boolean, optional
     :param is_regression: Whether the model is a regression model or not (if False, assumes a classification model).
                           Default is False.
     :type is_regression: boolean, optional
@@ -60,7 +63,9 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
     def __init__(self, estimator: Union[BaseEstimator, Model] = None, target_accuracy: Optional[float] = 0.998,
                  cells: Optional[list] = None, categorical_features: Optional[Union[np.ndarray, list]] = None,
-                 features_to_minimize: Optional[Union[np.ndarray, list]] = None, train_only_QI: Optional[bool] = True,
+                 encoder: Optional[Union[OrdinalEncoder, OneHotEncoder]] = None,
+                 features_to_minimize: Optional[Union[np.ndarray, list]] = None,
+                 train_only_features_to_minimize: Optional[bool] = True,
                  is_regression: Optional[bool] = False):
 
         self.estimator = estimator
@@ -75,8 +80,9 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         if categorical_features:
             self.categorical_features = categorical_features
         self.features_to_minimize = features_to_minimize
-        self.train_only_QI = train_only_QI
+        self.train_only_features_to_minimize = train_only_features_to_minimize
         self.is_regression = is_regression
+        self.encoder = encoder
 
     def get_params(self, deep=True):
         """
@@ -89,9 +95,14 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         """
         ret = {}
         ret['target_accuracy'] = self.target_accuracy
+        ret['categorical_features'] = self.categorical_features
+        ret['features_to_minimize'] = self.features_to_minimize
+        ret['train_only_features_to_minimize'] = self.train_only_features_to_minimize
+        ret['is_regression'] = self.is_regression
         if deep:
             ret['cells'] = copy.deepcopy(self.cells)
             ret['estimator'] = self.estimator
+            ret['encoder'] = self.encoder
         else:
             ret['cells'] = copy.copy(self.cells)
         return ret
@@ -111,6 +122,14 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         """
         if 'target_accuracy' in params:
             self.target_accuracy = params['target_accuracy']
+        if 'categorical_features' in params:
+            self.categorical_features = params['categorical_features']
+        if 'features_to_minimize' in params:
+            self.features_to_minimize = params['features_to_minimize']
+        if 'train_only_features_to_minimize' in params:
+            self.train_only_features_to_minimize = params['train_only_features_to_minimize']
+        if 'is_regression' in params:
+            self.is_regression = params['is_regression']
         if 'cells' in params:
             self.cells = params['cells']
         return self
@@ -208,7 +227,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
             # divide dataset into train and test
             used_data = x
-            if self.train_only_QI:
+            if self.train_only_features_to_minimize:
                 used_data = x_QI
             if self.is_regression:
                 X_train, X_test, y_train, y_test = train_test_split(x, dataset.get_labels(), test_size=0.4, random_state=14)
@@ -219,8 +238,10 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             X_train_QI = X_train.loc[:, self.features_to_minimize]
             X_test_QI = X_test.loc[:, self.features_to_minimize]
             used_X_train = X_train
-            if self.train_only_QI:
+            used_X_test = X_test
+            if self.train_only_features_to_minimize:
                 used_X_train = X_train_QI
+                used_X_test = X_test_QI
 
             # collect feature data (such as min, max)
             feature_data = {}
@@ -236,46 +257,20 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                         fd['range'] = len(np.unique(values))
                     feature_data[feature] = fd
 
-            # prepare data for DT
-
-            # preprocessor to fit data that have features not included in QI (to get accuracy)
-            numeric_features = [f for f in self._features if f not in self.categorical_features]
-            numeric_transformer = Pipeline(
-                steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
-            )
-            categorical_transformer = OneHotEncoder(handle_unknown="ignore", sparse=False)
-            preprocessor = ColumnTransformer(
-                transformers=[
-                    ("num", numeric_transformer, numeric_features),
-                    ("cat", categorical_transformer, self.categorical_features),
-                ]
-            )
-            preprocessor.fit(x)
-
-            if self.train_only_QI:
-                categorical_features = [f for f in self._features if f in self.categorical_features and
-                                        f in self.features_to_minimize]
-
+            # default encoder in case none provided
+            if self.encoder is None:
+                numeric_features = [f for f in self._features if f not in self.categorical_features]
                 numeric_transformer = Pipeline(
                         steps=[('imputer', SimpleImputer(strategy='constant', fill_value=0))]
                 )
-
-                numeric_features = [f for f in self._features if f not in self.categorical_features and
-                                    f in self.features_to_minimize]
                 categorical_transformer = OneHotEncoder(handle_unknown="ignore", sparse=False)
-
-                preprocessor_QI_features = ColumnTransformer(
+                self.encoder = ColumnTransformer(
                         transformers=[
                             ("num", numeric_transformer, numeric_features),
-                            ("cat", categorical_transformer, categorical_features),
+                            ("cat", categorical_transformer, self.categorical_features),
                         ]
                 )
-                preprocessor_QI_features.fit(x_QI)
-                x_prepared = preprocessor_QI_features.transform(X_train_QI)
-            else:
-                x_prepared = preprocessor.transform(X_train)
-
-            self._preprocessor = preprocessor
+                self.encoder.fit(x)
 
             self.cells = []
             self._categorical_values = {}
@@ -285,11 +280,12 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             else:
                 self._dt = DecisionTreeClassifier(random_state=0, min_samples_split=2,
                                                   min_samples_leaf=1)
+
+            # prepare data for DT
+            self._encode_categorical_features(used_data, save_mapping=True)
+            x_prepared = self._encode_categorical_features(used_X_train)
             self._dt.fit(x_prepared, y_train)
-
-            self._modify_categorical_features(used_data)
-
-            x_prepared = pd.DataFrame(x_prepared, columns=self._categorical_data.columns)
+            x_prepared_test = self._encode_categorical_features(used_X_test)
 
             self._calculate_cells()
             self._modify_cells()
@@ -303,19 +299,10 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
             # self._cells currently holds the generalization created from the tree leaves
             self._calculate_generalizations()
-
-            # apply generalizations to test data
-            if self.train_only_QI:
-                x_prepared_test = preprocessor_QI_features.transform(X_test_QI)
-            else:
-                x_prepared_test = preprocessor.transform(X_test)
-
-            x_prepared_test = pd.DataFrame(x_prepared_test, index=X_test.index, columns=self._categorical_data.columns)
-
             generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells, self._cells_by_id)
 
             # check accuracy
-            accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
+            accuracy = self.estimator.score(ArrayDataset(self.encoder.transform(generalized), y_test))
             print('Initial accuracy of model on generalized data, relative to original model predictions '
                   '(base generalization derived from tree, before improvements): %f' % accuracy)
 
@@ -340,7 +327,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     self._calculate_generalizations()
                     generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells,
                                                    self._cells_by_id)
-                    accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
+                    accuracy = self.estimator.score(ArrayDataset(self.encoder.transform(generalized), y_test))
                     # if accuracy passed threshold roll back to previous iteration generalizations
                     if accuracy < self.target_accuracy:
                         self.cells = cells_previous_iter
@@ -364,7 +351,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
                     self._calculate_generalizations()
                     generalized = self._generalize(X_test, x_prepared_test, nodes, self.cells, self._cells_by_id)
-                    accuracy = self.estimator.score(ArrayDataset(preprocessor.transform(generalized), y_test))
+                    accuracy = self.estimator.score(ArrayDataset(self.encoder.transform(generalized), y_test))
                     print('Removed feature: %s, new relative accuracy: %f' % (removed_feature, accuracy))
 
             # self._cells currently holds the chosen generalization based on target accuracy
@@ -416,38 +403,13 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         if not self._features:
             self._features = [i for i in range(x.shape[1])]
 
-        representatives = pd.DataFrame(columns=self._features)  # only columns
-        generalized = pd.DataFrame(x, columns=self._features, copy=True)  # original data
         mapped = np.zeros(x.shape[0])  # to mark records we already mapped
-
-        # iterate over cells (leaves in decision tree)
+        all_indexes = []
         for i in range(len(self.cells)):
-            # Copy the representatives from the cells into another data structure:
-            # iterate over features in test data
-            for feature in self._features:
-                # if feature has a representative value in the cell and should not
-                # be left untouched, take the representative value
-                if feature in self.cells[i]['representative'] and \
-                        ('untouched' not in self.cells[i]
-                         or feature not in self.cells[i]['untouched']):
-                    representatives.loc[i, feature] = self.cells[i]['representative'][feature]
-                # else, drop the feature (removes from representatives columns that
-                # do not have a representative value or should remain untouched)
-                elif feature in representatives.columns.tolist():
-                    representatives = representatives.drop(feature, axis=1)
-
-            # get the indexes of all records that map to this cell
             indexes = self._get_record_indexes_for_cell(x, self.cells[i], mapped)
+            all_indexes.append(indexes)
+        generalized = self._generalize_indexes(x, self.cells, all_indexes)
 
-            # replace the values in the representative columns with the representative
-            # values (leaves others untouched)
-            if indexes and not representatives.columns.empty:
-                if len(indexes) > 1:
-                    replace = pd.concat([representatives.loc[i].to_frame().T] * len(indexes)).reset_index(drop=True)
-                else:
-                    replace = representatives.loc[i].to_frame().T.reset_index(drop=True)
-                replace.index = indexes
-                generalized.loc[indexes, representatives.columns] = replace
         if dataset and dataset.is_pandas:
             return generalized
         elif isinstance(X, pd.DataFrame):
@@ -477,29 +439,36 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         mapped.itemset(i, 1)
         return True
 
-    def _modify_categorical_features(self, X):
-        self._categorical_values = {}
-        self._one_hot_vector_features_to_features = {}
+    def _encode_categorical_features(self, X, save_mapping=False):
+        if save_mapping:
+            self._categorical_values = {}
+            self._one_hot_vector_features_to_features = {}
         features_to_remove = []
         used_features = self._features
-        if self.train_only_QI:
+        if self.train_only_features_to_minimize:
             used_features = self.features_to_minimize
         for feature in self.categorical_features:
             if feature in used_features:
                 try:
                     all_values = X.loc[:, feature]
                     values = list(all_values.unique())
-                    self._categorical_values[feature] = values
-                    X[feature] = pd.Categorical(X.loc[:, feature], categories=values, ordered=False)
+                    if save_mapping:
+                        self._categorical_values[feature] = values
+                    X[feature] = pd.Categorical(X.loc[:, feature], categories=self._categorical_values[feature],
+                                                ordered=False)
                     ohe = pd.get_dummies(X[feature], prefix=feature)
-                    for one_hot_vector_feature in ohe.columns:
-                        self._one_hot_vector_features_to_features[one_hot_vector_feature] = feature
+                    if save_mapping:
+                        for one_hot_vector_feature in ohe.columns:
+                            self._one_hot_vector_features_to_features[one_hot_vector_feature] = feature
                     X = pd.concat([X, ohe], axis=1)
                     features_to_remove.append(feature)
                 except KeyError:
                     print("feature " + feature + "not found in training data")
 
-        self._categorical_data = X.drop(features_to_remove, axis=1)
+        new_data = X.drop(features_to_remove, axis=1)
+        if save_mapping:
+            self._encoded_features = new_data.columns
+        return new_data
 
     def _cell_contains_numeric(self, f, range, x):
         i = self._features.index(f)
@@ -538,7 +507,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
             return [cell]
 
         cells = []
-        feature = self._categorical_data.columns[feature_index]
+        feature = self._encoded_features[feature_index]
         threshold = self._dt.tree_.threshold[node]
         left_child = self._dt.tree_.children_left[node]
         right_child = self._dt.tree_.children_right[node]
@@ -569,7 +538,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
 
     def _modify_cells(self):
         cells = []
-        features = self._categorical_data.columns
+        features = self._encoded_features
         for cell in self.cells:
             new_cell = {'id': cell['id'], 'label': cell['label'], 'ranges': {}, 'categories': {}, 'hist': cell['hist'],
                         'untouched': [], 'representative': None}
@@ -711,11 +680,19 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         return [(list(set([i for i, v in enumerate(p) if v == 1]) & nodeSet))[0] for p in paths]
 
     def _generalize(self, original_data, prepared_data, level_nodes, cells, cells_by_id):
+        mapping_to_cells = self._map_to_cells(prepared_data, level_nodes, cells_by_id)
+        all_indexes = []
+        for i in range(len(cells)):
+            # get the indexes of all records that map to this cell
+            indexes = [j for j in mapping_to_cells if mapping_to_cells[j]['id'] == cells[i]['id']]
+            all_indexes.append(indexes)
+        return self._generalize_indexes(original_data, cells, all_indexes)
+
+    def _generalize_indexes(self, original_data, cells, all_indexes):
         # prepared data include one hot encoded categorical data + QI
         representatives = pd.DataFrame(columns=self._features)  # empty except for columns
-        generalized = pd.DataFrame(prepared_data, columns=self._categorical_data.columns, copy=True)
         original_data_generalized = pd.DataFrame(original_data, columns=self._features, copy=True)
-        mapping_to_cells = self._map_to_cells(generalized, level_nodes, cells_by_id)
+
         # iterate over cells (leaves in decision tree)
         for i in range(len(cells)):
             # This code just copies the representatives from the cells into another data structure
@@ -731,9 +708,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                 elif feature in representatives.columns.tolist():
                     representatives = representatives.drop(feature, axis=1)
 
-            # get the indexes of all records that map to this cell
-            indexes = [j for j in mapping_to_cells if mapping_to_cells[j]['id'] == cells[i]['id']]
-
+            indexes = all_indexes[i]
             # replaces the values in the representative columns with the representative values
             # (leaves others untouched)
             if indexes and not representatives.columns.empty:
@@ -794,7 +769,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     cells_by_id = copy.deepcopy(self._cells_by_id)
                     GeneralizeToRepresentative._remove_feature_from_cells(new_cells, cells_by_id, feature)
                     generalized = self._generalize(original_data, prepared_data, nodes, new_cells, cells_by_id)
-                    accuracy_gain = self.estimator.score(ArrayDataset(self._preprocessor.transform(generalized),
+                    accuracy_gain = self.estimator.score(ArrayDataset(self.encoder.transform(generalized),
                                                                       labels)) - current_accuracy
                     if accuracy_gain < 0:
                         accuracy_gain = 0
@@ -817,7 +792,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
                     cells_by_id = copy.deepcopy(self._cells_by_id)
                     GeneralizeToRepresentative._remove_feature_from_cells(new_cells, cells_by_id, feature)
                     generalized = self._generalize(original_data, prepared_data, nodes, new_cells, cells_by_id)
-                    accuracy_gain = self.estimator.score(ArrayDataset(self._preprocessor.transform(generalized),
+                    accuracy_gain = self.estimator.score(ArrayDataset(self.encoder.transform(generalized),
                                                                       labels)) - current_accuracy
 
                     if accuracy_gain < 0:
@@ -838,7 +813,7 @@ class GeneralizeToRepresentative(BaseEstimator, MetaEstimatorMixin, TransformerM
         self._remove_categorical_untouched(self._generalizations)
 
     def _find_range_count(self, samples, ranges):
-        samples_df = pd.DataFrame(samples, columns=self._categorical_data.columns)
+        samples_df = pd.DataFrame(samples, columns=self._encoded_features)
         range_counts = {}
         last_value = None
         for r in ranges.keys():
diff --git a/tests/test_minimizer.py b/tests/test_minimizer.py
index dca3ebd..42e5cb2 100644
--- a/tests/test_minimizer.py
+++ b/tests/test_minimizer.py
@@ -74,8 +74,8 @@ def test_minimizer_fit(data):
     predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5)
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy)
     train_dataset = ArrayDataset(X, predictions, features_names=features)
 
     gen.fit(dataset=train_dataset)
@@ -102,6 +102,9 @@ def test_minimizer_fit(data):
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
+    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_minimizer_fit_pandas(data):
     features = ['age', 'height', 'sex', 'ola']
@@ -145,7 +148,8 @@ def test_minimizer_fit_pandas(data):
 
     # Append classifier to preprocessing pipeline.
     # Now we have a full prediction pipeline.
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5,
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy,
                                      categorical_features=categorical_features)
     train_dataset = ArrayDataset(X, predictions)
     gen.fit(dataset=train_dataset)
@@ -169,6 +173,9 @@ def test_minimizer_fit_pandas(data):
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(X[modified_features])) == False)
 
+    rel_accuracy = model.score(ArrayDataset(preprocessor.transform(transformed), predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_minimizer_params_categorical(data):
     # Assume three features, age, sex and height, and boolean label
@@ -226,12 +233,16 @@ def test_minimizer_params_categorical(data):
         predictions = np.argmax(predictions, axis=1)
     # Append classifier to preprocessing pipeline.
     # Now we have a full prediction pipeline.
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5,
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy,
                                      categorical_features=categorical_features, cells=cells)
     train_dataset = ArrayDataset(X, predictions)
     gen.fit(dataset=train_dataset)
     transformed = gen.transform(dataset=ArrayDataset(X))
 
+    rel_accuracy = model.score(ArrayDataset(preprocessor.transform(transformed), predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_minimizer_fit_QI(data):
     features = ['age', 'height', 'weight']
@@ -257,8 +268,8 @@ def test_minimizer_fit_QI(data):
     predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy, features_to_minimize=QI)
     train_dataset = ArrayDataset(X, predictions, features_names=features)
     gen.fit(dataset=train_dataset)
     transformed = gen.transform(dataset=ad)
@@ -284,6 +295,9 @@ def test_minimizer_fit_QI(data):
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
+    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_minimizer_fit_pandas_QI(data):
     features = ['age', 'height', 'weight', 'sex', 'ola']
@@ -329,7 +343,8 @@ def test_minimizer_fit_pandas_QI(data):
 
     # Append classifier to preprocessing pipeline.
     # Now we have a full prediction pipeline.
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5,
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy,
                                      categorical_features=categorical_features, features_to_minimize=QI)
     train_dataset = ArrayDataset(X, predictions)
     gen.fit(dataset=train_dataset)
@@ -356,6 +371,9 @@ def test_minimizer_fit_pandas_QI(data):
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(X[modified_features])) == False)
 
+    rel_accuracy = model.score(ArrayDataset(preprocessor.transform(transformed), predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_minimize_ndarray_iris():
     features = ['sepal length (cm)', 'sepal width (cm)', 'petal length (cm)', 'petal width (cm)']
@@ -368,8 +386,8 @@ def test_minimize_ndarray_iris():
     predictions = model.predict(ArrayDataset(x_train))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.3, features_to_minimize=QI)
+    target_accuracy = 0.3
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy, features_to_minimize=QI)
     # gen.fit(dataset=ArrayDataset(x_train, predictions))
     transformed = gen.fit_transform(dataset=ArrayDataset(x_train, predictions, features_names=features))
     gener = gen.generalizations
@@ -397,6 +415,9 @@ def test_minimize_ndarray_iris():
         assert (ncp > 0)
         assert (((transformed[indexes]) != (x_train[indexes])).any())
 
+    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_minimize_pandas_adult():
     (x_train, y_train), (x_test, y_test) = get_adult_dataset_pd()
@@ -433,8 +454,8 @@ def test_minimize_pandas_adult():
     predictions = model.predict(ArrayDataset(encoded))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.7,
+    target_accuracy = 0.7
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy,
                                      categorical_features=categorical_features, features_to_minimize=QI)
     gen.fit(dataset=ArrayDataset(x_train, predictions, features_names=features))
     transformed = gen.transform(dataset=ArrayDataset(x_train))
@@ -472,6 +493,9 @@ def test_minimize_pandas_adult():
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(x_train[modified_features])) == False)
 
+    rel_accuracy = model.score(ArrayDataset(preprocessor.transform(transformed), predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_german_credit_pandas():
     (x_train, y_train), (x_test, y_test) = get_german_credit_dataset_pd()
@@ -506,8 +530,8 @@ def test_german_credit_pandas():
     predictions = model.predict(ArrayDataset(encoded))
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.7,
+    target_accuracy = 0.7
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy,
                                      categorical_features=categorical_features, features_to_minimize=QI)
     gen.fit(dataset=ArrayDataset(x_train, predictions))
     transformed = gen.transform(dataset=ArrayDataset(x_train))
@@ -545,6 +569,9 @@ def test_german_credit_pandas():
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(x_train[modified_features])) == False)
 
+    rel_accuracy = model.score(ArrayDataset(preprocessor.transform(transformed), predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_regression():
     dataset = load_diabetes()
@@ -558,7 +585,8 @@ def test_regression():
     features = ['age', 'sex', 'bmi', 'bp',
                 's1', 's2', 's3', 's4', 's5', 's6']
 
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.7, is_regression=True,
+    target_accuracy = 0.7
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy, is_regression=True,
                                      features_to_minimize=QI)
     gen.fit(dataset=ArrayDataset(x_train, predictions, features_names=features))
     transformed = gen.transform(dataset=ArrayDataset(x_train, features_names=features))
@@ -615,6 +643,9 @@ def test_regression():
         assert (ncp > 0)
         assert (((transformed[indexes]) != (x_train[indexes])).any())
 
+    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_X_y(data):
     features = [0, 1, 2]
@@ -640,8 +671,8 @@ def test_X_y(data):
     predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy, features_to_minimize=QI)
     gen.fit(X=X, y=predictions)
     transformed = gen.transform(X)
     gener = gen.generalizations
@@ -666,6 +697,9 @@ def test_X_y(data):
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
+    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_X_y_features_names(data):
     features = ['age', 'height', 'weight']
@@ -691,8 +725,8 @@ def test_X_y_features_names(data):
     predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5, features_to_minimize=QI)
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy, features_to_minimize=QI)
     gen.fit(X=X, y=predictions, features_names=features)
     transformed = gen.transform(X=X, features_names=features)
     gener = gen.generalizations
@@ -717,6 +751,9 @@ def test_X_y_features_names(data):
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
+    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_BaseEstimator_classification(data):
     features = ['age', 'height', 'weight', 'sex', 'ola']
@@ -760,7 +797,8 @@ def test_BaseEstimator_classification(data):
 
     # Append classifier to preprocessing pipeline.
     # Now we have a full prediction pipeline.
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5,
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy,
                                      categorical_features=categorical_features, features_to_minimize=QI)
     train_dataset = ArrayDataset(X, predictions)
     gen.fit(dataset=train_dataset)
@@ -787,6 +825,9 @@ def test_BaseEstimator_classification(data):
         assert (ncp > 0)
         assert (((transformed[modified_features]).equals(X[modified_features])) == False)
 
+    rel_accuracy = model.score(preprocessor.transform(transformed), predictions)
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_BaseEstimator_regression():
     dataset = load_diabetes()
@@ -799,8 +840,8 @@ def test_BaseEstimator_regression():
     QI = ['age', 'bmi', 's2', 's5']
     features = ['age', 'sex', 'bmi', 'bp',
                 's1', 's2', 's3', 's4', 's5', 's6']
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.7, is_regression=True,
+    target_accuracy = 0.7
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy, is_regression=True,
                                      features_to_minimize=QI)
     gen.fit(dataset=ArrayDataset(x_train, predictions, features_names=features))
     transformed = gen.transform(dataset=ArrayDataset(x_train, features_names=features))
@@ -857,6 +898,9 @@ def test_BaseEstimator_regression():
         assert (ncp > 0)
         assert (((transformed[indexes]) != (x_train[indexes])).any())
 
+    rel_accuracy = model.score(transformed, predictions)
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_keras_model():
     (X, y), (x_test, y_test) = get_iris_dataset_np()
@@ -874,8 +918,8 @@ def test_keras_model():
     predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5)
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy)
     test_dataset = ArrayDataset(x_test, predictions)
 
     gen.fit(dataset=test_dataset)
@@ -895,6 +939,9 @@ def test_keras_model():
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
+    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_blackbox_model():
     (X, y), (x_test, y_test) = get_iris_dataset_np()
@@ -907,8 +954,8 @@ def test_blackbox_model():
     predictions = model.predict(ad)
     if predictions.shape[1] > 1:
         predictions = np.argmax(predictions, axis=1)
-
-    gen = GeneralizeToRepresentative(model, target_accuracy=0.5)
+    target_accuracy = 0.5
+    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy)
     train_dataset = ArrayDataset(x_test, predictions)
 
     gen.fit(dataset=train_dataset)
@@ -939,6 +986,9 @@ def test_blackbox_model():
         assert (ncp > 0)
         assert (((transformed[indexes]) != (X[indexes])).any())
 
+    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
+    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
+
 
 def test_untouched():
     cells = [{"id": 1, "ranges": {"age": {"start": None, "end": 38}}, "label": 0,

From 1c4b963add69e6cd12fe5d2e5c85f94de29595ec Mon Sep 17 00:00:00 2001
From: Shlomit Shachor <shlomiti@il.ibm.com>
Date: Sun, 26 Jun 2022 14:43:22 +0300
Subject: [PATCH 13/26] Wrappers no train (#40)

1) Handle train None in Data
2) Update BB Classifier to handle None either for train or test (x or y)
---
 apt/utils/datasets/datasets.py |  4 ++
 apt/utils/models/model.py      | 37 ++++++++++++-----
 tests/test_model.py            | 72 ++++++++++++++++++++++++++++++++++
 3 files changed, 103 insertions(+), 10 deletions(-)

diff --git a/apt/utils/datasets/datasets.py b/apt/utils/datasets/datasets.py
index 02d886e..6569b37 100644
--- a/apt/utils/datasets/datasets.py
+++ b/apt/utils/datasets/datasets.py
@@ -400,6 +400,8 @@ class Data:
 
         :return: training samples
         """
+        if self.train is None:
+            return None
         return self.train.get_samples()
 
     def get_train_labels(self) -> Collection[Any]:
@@ -408,6 +410,8 @@ class Data:
 
         :return: training labels
         """
+        if self.train is None:
+            return None
         return self.train.get_labels()
 
     def get_test_samples(self) -> Collection[Any]:
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index 7af3a01..bba743b 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -153,19 +153,36 @@ class BlackboxClassifier(Model):
     def __init__(self, model: Data, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
                  unlimited_queries: Optional[bool] = True, **kwargs):
         super().__init__(model, output_type, black_box_access=True, unlimited_queries=False, **kwargs)
-        x = model.get_train_samples()
-        y = model.get_train_labels()
-        self.nb_classes = self.get_nb_classes(y)
-        y = check_and_transform_label_format(y, nb_classes=self.nb_classes)
+        x_train_pred = model.get_train_samples()
+        y_train_pred = model.get_train_labels()
+        x_test_pred = model.get_test_samples()
+        y_test_pred = model.get_test_labels()
 
-        if model.get_test_samples() is not None and type(x) == np.ndarray:
-            x = np.vstack((x, model.get_test_samples()))
+        if x_train_pred is not None and y_train_pred is not None and x_test_pred is not None and y_test_pred is not None:
+            if type(y_train_pred) != np.ndarray or type(y_test_pred) != np.ndarray \
+               or type(y_train_pred) != np.ndarray or type(y_test_pred) != np.ndarray:
+                raise NotImplementedError("X/Y Data should be np ndarray")
 
-        if model.get_test_labels() is not None and type(y) == np.ndarray:
-            y = np.vstack((y, check_and_transform_label_format(model.get_test_labels(), nb_classes=self.nb_classes)))
+            self.nb_classes = self.get_nb_classes(y_train_pred)
+            y_train_pred = check_and_transform_label_format(y_train_pred, nb_classes=self.nb_classes)
+            y_test_pred = check_and_transform_label_format(y_test_pred, nb_classes=self.nb_classes)
+            x_pred = np.vstack((x_train_pred, x_test_pred))
+            y_pred = np.vstack((y_train_pred, y_test_pred))
+        elif x_test_pred is not None and y_test_pred is not None:
+            self.nb_classes = self.get_nb_classes(y_test_pred)
+            y_test_pred = check_and_transform_label_format(y_test_pred, nb_classes=self.nb_classes)
+            x_pred = x_test_pred
+            y_pred = y_test_pred
+        elif x_train_pred is not None and y_train_pred is not None:
+            self.nb_classes = self.get_nb_classes(y_train_pred)
+            y_train_pred = check_and_transform_label_format(y_train_pred, nb_classes=self.nb_classes)
+            x_pred = x_train_pred
+            y_pred = y_train_pred
+        else:
+            raise NotImplementedError("Invalid data - None")
 
-        predict_fn = (x, y)
-        self._art_model = BlackBoxClassifier(predict_fn, x.shape[1:], self.nb_classes, fuzzy_float_compare=True)
+        predict_fn = (x_pred, y_pred)
+        self._art_model = BlackBoxClassifier(predict_fn, x_pred.shape[1:], self.nb_classes, fuzzy_float_compare=True)
 
     def fit(self, train_data: Dataset, **kwargs) -> None:
         """
diff --git a/tests/test_model.py b/tests/test_model.py
index 4470658..3a5e45c 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -73,3 +73,75 @@ def test_blackbox_classifier():
 
     score = model.score(test)
     assert(0.0 <= score <= 1.0)
+
+def test_blackbox_classifier_no_test():
+    (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
+
+    train = ArrayDataset(x_train, y_train)
+
+    data = Data(train)
+    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    pred = model.predict(train)
+    assert(pred.shape[0] == x_train.shape[0])
+
+    score = model.score(train)
+    assert(0.0 <= score <= 1.0)
+
+
+def test_blackbox_classifier_no_train():
+    (_, _), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
+
+    test = ArrayDataset(x_test, y_test)
+    data = Data(test=test)
+    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    pred = model.predict(test)
+    assert(pred.shape[0] == x_test.shape[0])
+
+    score = model.score(test)
+    assert(0.0 <= score <= 1.0)
+
+
+def test_blackbox_classifier_no_test_y():
+    (x_train, y_train), (x_test, _) = dataset_utils.get_iris_dataset_np()
+
+    train = ArrayDataset(x_train, y_train)
+    test = ArrayDataset(x_test)
+    data = Data(train, test)
+    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    pred = model.predict(train)
+    assert(pred.shape[0] == x_train.shape[0])
+
+    score = model.score(train)
+    assert(0.0 <= score <= 1.0)
+
+    # since no test_y, BBC should use only train thus predict test should fail
+    unable_to_predict_test = False
+    try:
+        model.predict(test)
+    except Exception:
+        unable_to_predict_test = True
+
+    assert unable_to_predict_test
+
+def test_blackbox_classifier_no_train_y():
+    (x_train, _), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
+
+    train = ArrayDataset(x_train)
+    test = ArrayDataset(x_test, y_test)
+    data = Data(train, test)
+    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    pred = model.predict(test)
+    assert (pred.shape[0] == x_test.shape[0])
+
+    score = model.score(test)
+    assert (0.0 <= score <= 1.0)
+
+    # since no train_y, BBC should use only test thus predict train should fail
+    unable_to_predict_train = False
+    try:
+        model.predict(train)
+    except BaseException:
+        unable_to_predict_train = True
+
+    assert(unable_to_predict_train,True)
+

From bb224cd3dd48b3a987dfde9fc5b56d817a8f4eea Mon Sep 17 00:00:00 2001
From: Natalia Razinkov <97098247+NataliRa@users.noreply.github.com>
Date: Sun, 26 Jun 2022 15:15:51 +0300
Subject: [PATCH 14/26] Bug fix for PytorchData dataset

---
 apt/utils/datasets/datasets.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/apt/utils/datasets/datasets.py b/apt/utils/datasets/datasets.py
index 6569b37..a386226 100644
--- a/apt/utils/datasets/datasets.py
+++ b/apt/utils/datasets/datasets.py
@@ -292,7 +292,7 @@ class PytorchData(Dataset):
         :type idx: int
         :return: the sample as a pytorch Tensor
         """
-        return self.x[idx]
+        return self._x[idx]
 
     def get_item(self, idx: int) -> Tensor:
         """
@@ -302,11 +302,11 @@ class PytorchData(Dataset):
         :type idx: int
         :return: the sample and label as pytorch Tensors. Returned as a tuple (sample, label)
         """
-        sample, label = self.x[idx], self.y[idx]
+        sample, label = self._x[idx], self._y[idx]
         return sample, label
 
     def __len__(self):
-        return len(self.x)
+        return len(self._x)
 
 
 class DatasetFactory:

From c6eb553a9f4bd7bfb33be840d254423e0b8c06ae Mon Sep 17 00:00:00 2001
From: abigailgold <57357634+abigailgold@users.noreply.github.com>
Date: Thu, 30 Jun 2022 18:23:53 +0300
Subject: [PATCH 15/26] Blackbox predict method (#43)

* Support output probabilities
* Support black box classifier with predict method
* Update requirements (security alert #1)
---
 apt/utils/models/__init__.py |   3 +-
 apt/utils/models/model.py    | 150 +++++++++++++++++++++++++----------
 requirements.txt             |   2 +-
 tests/test_minimizer.py      |   5 +-
 tests/test_model.py          |  49 ++++++++++--
 5 files changed, 159 insertions(+), 50 deletions(-)

diff --git a/apt/utils/models/__init__.py b/apt/utils/models/__init__.py
index f6a89fc..a48a1a3 100644
--- a/apt/utils/models/__init__.py
+++ b/apt/utils/models/__init__.py
@@ -1,3 +1,4 @@
-from apt.utils.models.model import Model, BlackboxClassifier, ModelOutputType, ScoringMethod
+from apt.utils.models.model import Model, BlackboxClassifier, ModelOutputType, ScoringMethod, \
+    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction
 from apt.utils.models.sklearn_model import SklearnModel, SklearnClassifier, SklearnRegressor
 from apt.utils.models.keras_model import KerasClassifier
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index bba743b..eff9271 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -1,5 +1,5 @@
 from abc import ABCMeta, abstractmethod
-from typing import Any, Optional
+from typing import Any, Optional, Callable, Tuple
 from enum import Enum, auto
 import numpy as np
 
@@ -126,7 +126,7 @@ class Model(metaclass=ABCMeta):
         :return: the number of classes as integer
         """
         if len(y.shape) == 1:
-            return len(np.unique(y))
+            return np.max(y) + 1
         else:
             return y.shape[1]
 
@@ -135,54 +135,41 @@ class BlackboxClassifier(Model):
     """
     Wrapper for black-box ML classification models.
 
-    :param model: The training and/or test data along with the model's predictions for the data. Assumes that the data
-                  is represented as numpy arrays. Labels are expected to either be one-hot encoded or
-                  a 1D-array of categorical labels (consecutive integers starting at 0).
-    :type model: `Data` object
-    :param output_type: The type of output the model yields (vector/label only for classifiers,
-                        value for regressors)
+    :param model: The training and/or test data along with the model's predictions for the data or a callable predict
+                  method.
+    :type model: `Data` object or Callable
+    :param output_type: The type of output the model yields (vector/label only)
     :type output_type: `ModelOutputType`
     :param black_box_access: Boolean describing the type of deployment of the model (when in production).
-                             Always assumed to be True for this wrapper.
+                             Always assumed to be True (black box) for this wrapper.
     :type black_box_access: boolean, optional
     :param unlimited_queries: Boolean indicating whether a user can perform unlimited queries to the model API.
-                              Always assumed to be False for this wrapper.
     :type unlimited_queries: boolean, optional
     """
 
-    def __init__(self, model: Data, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
+    def __init__(self, model: Any, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
                  unlimited_queries: Optional[bool] = True, **kwargs):
-        super().__init__(model, output_type, black_box_access=True, unlimited_queries=False, **kwargs)
-        x_train_pred = model.get_train_samples()
-        y_train_pred = model.get_train_labels()
-        x_test_pred = model.get_test_samples()
-        y_test_pred = model.get_test_labels()
+        super().__init__(model, output_type, black_box_access=True, unlimited_queries=unlimited_queries, **kwargs)
+        self._nb_classes = None
+        self._input_shape = None
 
-        if x_train_pred is not None and y_train_pred is not None and x_test_pred is not None and y_test_pred is not None:
-            if type(y_train_pred) != np.ndarray or type(y_test_pred) != np.ndarray \
-               or type(y_train_pred) != np.ndarray or type(y_test_pred) != np.ndarray:
-                raise NotImplementedError("X/Y Data should be np ndarray")
+    @property
+    def nb_classes(self) -> int:
+        """
+        Return the number of prediction classes of the model.
 
-            self.nb_classes = self.get_nb_classes(y_train_pred)
-            y_train_pred = check_and_transform_label_format(y_train_pred, nb_classes=self.nb_classes)
-            y_test_pred = check_and_transform_label_format(y_test_pred, nb_classes=self.nb_classes)
-            x_pred = np.vstack((x_train_pred, x_test_pred))
-            y_pred = np.vstack((y_train_pred, y_test_pred))
-        elif x_test_pred is not None and y_test_pred is not None:
-            self.nb_classes = self.get_nb_classes(y_test_pred)
-            y_test_pred = check_and_transform_label_format(y_test_pred, nb_classes=self.nb_classes)
-            x_pred = x_test_pred
-            y_pred = y_test_pred
-        elif x_train_pred is not None and y_train_pred is not None:
-            self.nb_classes = self.get_nb_classes(y_train_pred)
-            y_train_pred = check_and_transform_label_format(y_train_pred, nb_classes=self.nb_classes)
-            x_pred = x_train_pred
-            y_pred = y_train_pred
-        else:
-            raise NotImplementedError("Invalid data - None")
+        :return: Number of prediction classes of the model.
+        """
+        return self._nb_classes
 
-        predict_fn = (x_pred, y_pred)
-        self._art_model = BlackBoxClassifier(predict_fn, x_pred.shape[1:], self.nb_classes, fuzzy_float_compare=True)
+    @property
+    def input_shape(self) -> Tuple[int, ...]:
+        """
+        Return the shape of input to the model.
+
+        :return: Shape of input to the model.
+        """
+        return self._input_shape
 
     def fit(self, train_data: Dataset, **kwargs) -> None:
         """
@@ -212,8 +199,91 @@ class BlackboxClassifier(Model):
         :return: the score as float (for classifiers, between 0 and 1)
         """
         predicted = self._art_model.predict(test_data.get_samples())
-        y = check_and_transform_label_format(test_data.get_labels(), nb_classes=self.nb_classes)
+        y = check_and_transform_label_format(test_data.get_labels(), nb_classes=self._nb_classes)
         if scoring_method == ScoringMethod.ACCURACY:
             return np.count_nonzero(np.argmax(y, axis=1) == np.argmax(predicted, axis=1)) / predicted.shape[0]
         else:
             raise NotImplementedError
+
+
+class BlackboxClassifierPredictions(BlackboxClassifier):
+    """
+    Wrapper for black-box ML classification models using data and predictions.
+
+    :param model: The training and/or test data along with the model's predictions for the data. Assumes that the data
+                  is represented as numpy arrays. Labels are expected to either be class probabilities (multi-column) or
+                  a 1D-array of categorical labels (consecutive integers starting at 0).
+    :type model: `Data` object
+    :param output_type: The type of output the model yields (vector/label only)
+    :type output_type: `ModelOutputType`
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Always assumed to be True for this wrapper.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: Boolean indicating whether a user can perform unlimited queries to the model API.
+                              Always assumed to be False for this wrapper.
+    :type unlimited_queries: boolean, optional
+    """
+
+    def __init__(self, model: Data, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
+                 unlimited_queries: Optional[bool] = True, **kwargs):
+        super().__init__(model, output_type, black_box_access=True, unlimited_queries=False, **kwargs)
+        x_train_pred = model.get_train_samples()
+        y_train_pred = model.get_train_labels()
+        x_test_pred = model.get_test_samples()
+        y_test_pred = model.get_test_labels()
+
+        if y_train_pred is not None and len(y_train_pred.shape) == 1:
+            self._nb_classes = self.get_nb_classes(y_train_pred)
+            y_train_pred = check_and_transform_label_format(y_train_pred, nb_classes=self._nb_classes)
+        if y_test_pred is not None and len(y_test_pred.shape) == 1:
+            if self._nb_classes is None:
+                self._nb_classes = self.get_nb_classes(y_test_pred)
+            y_test_pred = check_and_transform_label_format(y_test_pred, nb_classes=self._nb_classes)
+
+        if x_train_pred is not None and y_train_pred is not None and x_test_pred is not None and y_test_pred is not None:
+            if not all(isinstance(arr, np.ndarray)
+                       for arr in (x_train_pred, x_test_pred, y_train_pred, y_test_pred)):
+                raise NotImplementedError("X/Y Data should be numpy array")
+            x_pred = np.vstack((x_train_pred, x_test_pred))
+            y_pred = np.vstack((y_train_pred, y_test_pred))
+        elif x_test_pred is not None and y_test_pred is not None:
+            x_pred = x_test_pred
+            y_pred = y_test_pred
+        elif x_train_pred is not None and y_train_pred is not None:
+            x_pred = x_train_pred
+            y_pred = y_train_pred
+        else:
+            raise NotImplementedError("Invalid data - None")
+
+        self._nb_classes = self.get_nb_classes(y_pred)
+        self._input_shape = x_pred.shape[1:]
+        predict_fn = (x_pred, y_pred)
+        self._art_model = BlackBoxClassifier(predict_fn, self._input_shape, self._nb_classes, fuzzy_float_compare=True)
+
+
+class BlackboxClassifierPredictFunction(BlackboxClassifier):
+    """
+    Wrapper for black-box ML classification models using a predict function.
+
+    :param model: Function that takes in an `np.ndarray` of input data and returns predictions either as class
+                  probabilities (multi-column) or a 1D-array of categorical labels (consecutive integers starting at 0).
+    :type model: Callable
+    :param output_type: The type of output the model yields (vector/label only)
+    :type output_type: `ModelOutputType`
+    :param input_shape: Shape of input to the model.
+    :type input_shape: Tuple[int, ...]
+    :param nb_classes: Number of prediction classes of the model.
+    :type nb_classes: int
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Always assumed to be True for this wrapper.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: Boolean indicating whether a user can perform unlimited queries to the model API.
+    :type unlimited_queries: boolean, optional
+    """
+
+    def __init__(self, model: Callable, output_type: ModelOutputType, input_shape: Tuple[int, ...], nb_classes: int,
+                 black_box_access: Optional[bool] = True, unlimited_queries: Optional[bool] = True, **kwargs):
+        super().__init__(model, output_type, black_box_access=True, unlimited_queries=unlimited_queries, **kwargs)
+        self._nb_classes = nb_classes
+        self._input_shape = input_shape
+        self._art_model = BlackBoxClassifier(model, self._input_shape, self._nb_classes)
diff --git a/requirements.txt b/requirements.txt
index f841d7c..4ce8d46 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,4 +1,4 @@
-numpy==1.21.0
+numpy>=1.22
 pandas==1.1.0
 scipy==1.4.1
 scikit-learn==0.22.2
diff --git a/tests/test_minimizer.py b/tests/test_minimizer.py
index 42e5cb2..2d888bc 100644
--- a/tests/test_minimizer.py
+++ b/tests/test_minimizer.py
@@ -18,7 +18,8 @@ from apt.minimization import GeneralizeToRepresentative
 from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
 from apt.utils.dataset_utils import get_iris_dataset_np, get_adult_dataset_pd, get_german_credit_dataset_pd
 from apt.utils.datasets import ArrayDataset, Data
-from apt.utils.models import SklearnClassifier, ModelOutputType, SklearnRegressor, KerasClassifier, BlackboxClassifier
+from apt.utils.models import SklearnClassifier, ModelOutputType, SklearnRegressor, KerasClassifier, \
+    BlackboxClassifierPredictions
 
 
 @pytest.fixture
@@ -949,7 +950,7 @@ def test_blackbox_model():
     test_data = ArrayDataset(x_test, y_test)
     data = Data(train_data, test_data)
 
-    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
     ad = ArrayDataset(x_test)
     predictions = model.predict(ad)
     if predictions.shape[1] > 1:
diff --git a/tests/test_model.py b/tests/test_model.py
index 3a5e45c..2acc0d9 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -1,6 +1,8 @@
 import pytest
+import numpy as np
 
-from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, BlackboxClassifier
+from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, \
+    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction
 from apt.utils.datasets import ArrayDataset, Data
 from apt.utils import dataset_utils
 
@@ -67,7 +69,7 @@ def test_blackbox_classifier():
     train = ArrayDataset(x_train, y_train)
     test = ArrayDataset(x_test, y_test)
     data = Data(train, test)
-    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
     pred = model.predict(test)
     assert(pred.shape[0] == x_test.shape[0])
 
@@ -80,7 +82,7 @@ def test_blackbox_classifier_no_test():
     train = ArrayDataset(x_train, y_train)
 
     data = Data(train)
-    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
     pred = model.predict(train)
     assert(pred.shape[0] == x_train.shape[0])
 
@@ -93,7 +95,7 @@ def test_blackbox_classifier_no_train():
 
     test = ArrayDataset(x_test, y_test)
     data = Data(test=test)
-    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
     pred = model.predict(test)
     assert(pred.shape[0] == x_test.shape[0])
 
@@ -107,7 +109,7 @@ def test_blackbox_classifier_no_test_y():
     train = ArrayDataset(x_train, y_train)
     test = ArrayDataset(x_test)
     data = Data(train, test)
-    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
     pred = model.predict(train)
     assert(pred.shape[0] == x_train.shape[0])
 
@@ -129,7 +131,7 @@ def test_blackbox_classifier_no_train_y():
     train = ArrayDataset(x_train)
     test = ArrayDataset(x_test, y_test)
     data = Data(train, test)
-    model = BlackboxClassifier(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
     pred = model.predict(test)
     assert (pred.shape[0] == x_test.shape[0])
 
@@ -145,3 +147,38 @@ def test_blackbox_classifier_no_train_y():
 
     assert(unable_to_predict_train,True)
 
+def test_blackbox_classifier_probabilities():
+    (x_train, _), (_, _) = dataset_utils.get_iris_dataset_np()
+    y_train = np.array([[0.23, 0.56, 0.21] for i in range(105)])
+
+    train = ArrayDataset(x_train, y_train)
+
+    data = Data(train)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    pred = model.predict(train)
+    assert (pred.shape[0] == x_train.shape[0])
+    assert (0.0 < pred).all()
+    assert (pred < 1.0).all()
+
+    score = model.score(train)
+    assert (0.0 <= score <= 1.0)
+
+
+def test_blackbox_classifier_predict():
+    def predict(x):
+        return [0.23, 0.56, 0.21]
+
+    (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
+
+    train = ArrayDataset(x_train, y_train)
+
+    model = BlackboxClassifierPredictFunction(predict, ModelOutputType.CLASSIFIER_PROBABILITIES, (4,), 3)
+    pred = model.predict(train)
+    assert (pred.shape[0] == x_train.shape[0])
+    assert (0.0 < pred).all()
+    assert (pred < 1.0).all()
+
+    score = model.score(train)
+    assert (0.0 <= score <= 1.0)
+
+

From 50317a8d67fcd1f1c7b3f17aeea5cfc4dd4d6114 Mon Sep 17 00:00:00 2001
From: natali <natali@il.ibm.com>
Date: Sat, 2 Jul 2022 23:29:49 +0300
Subject: [PATCH 16/26] fix for keras model check_and_transform_label_format
 requires nb_classes

---
 apt/utils/models/keras_model.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/apt/utils/models/keras_model.py b/apt/utils/models/keras_model.py
index 12d8ba3..0cb7252 100644
--- a/apt/utils/models/keras_model.py
+++ b/apt/utils/models/keras_model.py
@@ -57,7 +57,7 @@ class KerasClassifier(KerasModel):
         :type train_data: `Dataset`
         :return: None
         """
-        y_encoded = check_and_transform_label_format(train_data.get_labels())
+        y_encoded = check_and_transform_label_format(train_data.get_labels(), self._art_model.nb_classes)
         self._art_model.fit(train_data.get_samples(), y_encoded, **kwargs)
 
     def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:

From e25e58b2535c3709bc2b8bf7b14cf03e5d8847b9 Mon Sep 17 00:00:00 2001
From: Shlomit Shachor <shlomiti@il.ibm.com>
Date: Tue, 5 Jul 2022 11:32:17 +0300
Subject: [PATCH 17/26] enhance calculation of nb classes  + tests (#45)

* update get_nb_classes method to handle 1-hot and scalar input
---
 apt/utils/models/__init__.py      |  2 +-
 apt/utils/models/model.py         | 40 ++++++++++++++++++++-----------
 apt/utils/models/sklearn_model.py |  4 ++--
 tests/test_model.py               | 34 +++++++++++++++++++++++++-
 4 files changed, 62 insertions(+), 18 deletions(-)

diff --git a/apt/utils/models/__init__.py b/apt/utils/models/__init__.py
index a48a1a3..fe1721b 100644
--- a/apt/utils/models/__init__.py
+++ b/apt/utils/models/__init__.py
@@ -1,4 +1,4 @@
 from apt.utils.models.model import Model, BlackboxClassifier, ModelOutputType, ScoringMethod, \
-    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction
+    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, get_nb_classes, is_one_hot
 from apt.utils.models.sklearn_model import SklearnModel, SklearnClassifier, SklearnRegressor
 from apt.utils.models.keras_model import KerasClassifier
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index eff9271..ad5b00d 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -8,6 +8,29 @@ from art.estimators.classification import BlackBoxClassifier
 from art.utils import check_and_transform_label_format
 
 
+def is_one_hot(y: OUTPUT_DATA_ARRAY_TYPE) -> bool:
+    return len(y.shape) == 2 and y.shape[1] > 1
+
+
+def get_nb_classes(y: OUTPUT_DATA_ARRAY_TYPE) -> int:
+    """
+    Get the number of classes from an array of labels
+
+    :param y: the labels
+    :type y: numpy array
+    :return: the number of classes as integer
+    """
+    if y is None:
+        return 0
+
+    if type(y) != np.ndarray:
+        raise ValueError("Input should be numpy array")
+
+    if is_one_hot(y):
+        return y.shape[1]
+    else:
+        return int(np.max(y) + 1)
+
 class ModelOutputType(Enum):
     CLASSIFIER_PROBABILITIES = auto()  # vector of probabilities
     CLASSIFIER_LOGITS = auto()  # vector of logits
@@ -117,18 +140,7 @@ class Model(metaclass=ABCMeta):
         """
         return self._unlimited_queries
 
-    def get_nb_classes(self, y: OUTPUT_DATA_ARRAY_TYPE) -> int:
-        """
-        Get the number of classes from an array of labels
 
-        :param y: the labels
-        :type y: numpy array
-        :return: the number of classes as integer
-        """
-        if len(y.shape) == 1:
-            return np.max(y) + 1
-        else:
-            return y.shape[1]
 
 
 class BlackboxClassifier(Model):
@@ -233,11 +245,11 @@ class BlackboxClassifierPredictions(BlackboxClassifier):
         y_test_pred = model.get_test_labels()
 
         if y_train_pred is not None and len(y_train_pred.shape) == 1:
-            self._nb_classes = self.get_nb_classes(y_train_pred)
+            self._nb_classes = get_nb_classes(y_train_pred)
             y_train_pred = check_and_transform_label_format(y_train_pred, nb_classes=self._nb_classes)
         if y_test_pred is not None and len(y_test_pred.shape) == 1:
             if self._nb_classes is None:
-                self._nb_classes = self.get_nb_classes(y_test_pred)
+                self._nb_classes = get_nb_classes(y_test_pred)
             y_test_pred = check_and_transform_label_format(y_test_pred, nb_classes=self._nb_classes)
 
         if x_train_pred is not None and y_train_pred is not None and x_test_pred is not None and y_test_pred is not None:
@@ -255,7 +267,7 @@ class BlackboxClassifierPredictions(BlackboxClassifier):
         else:
             raise NotImplementedError("Invalid data - None")
 
-        self._nb_classes = self.get_nb_classes(y_pred)
+        self._nb_classes = get_nb_classes(y_pred)
         self._input_shape = x_pred.shape[1:]
         predict_fn = (x_pred, y_pred)
         self._art_model = BlackBoxClassifier(predict_fn, self._input_shape, self._nb_classes, fuzzy_float_compare=True)
diff --git a/apt/utils/models/sklearn_model.py b/apt/utils/models/sklearn_model.py
index 81294a5..8becc18 100644
--- a/apt/utils/models/sklearn_model.py
+++ b/apt/utils/models/sklearn_model.py
@@ -3,7 +3,7 @@ from typing import Optional
 from sklearn.preprocessing import OneHotEncoder
 from sklearn.base import BaseEstimator
 
-from apt.utils.models import Model, ModelOutputType
+from apt.utils.models import Model, ModelOutputType, get_nb_classes
 from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
 
 from art.estimators.classification.scikitlearn import SklearnClassifier as ArtSklearnClassifier
@@ -59,7 +59,7 @@ class SklearnClassifier(SklearnModel):
         :return: None
         """
         y = train_data.get_labels()
-        self.nb_classes = self.get_nb_classes(y)
+        self.nb_classes = get_nb_classes(y)
         y_encoded = check_and_transform_label_format(y, nb_classes=self.nb_classes)
         self._art_model.fit(train_data.get_samples(), y_encoded, **kwargs)
 
diff --git a/tests/test_model.py b/tests/test_model.py
index 2acc0d9..4274a02 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -2,7 +2,7 @@ import pytest
 import numpy as np
 
 from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, \
-    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction
+    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, is_one_hot, get_nb_classes
 from apt.utils.datasets import ArrayDataset, Data
 from apt.utils import dataset_utils
 
@@ -13,6 +13,9 @@ from tensorflow.keras.models import Sequential
 from tensorflow.keras.layers import Dense, Input
 
 
+from art.utils import to_categorical
+
+
 def test_sklearn_classifier():
     (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
     underlying_model = RandomForestClassifier()
@@ -181,4 +184,33 @@ def test_blackbox_classifier_predict():
     score = model.score(train)
     assert (0.0 <= score <= 1.0)
 
+def test_is_one_hot():
+    (_, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
+
+    assert (not is_one_hot(y_train))
+    assert (not is_one_hot(y_train.reshape(-1,1)))
+    assert (is_one_hot(to_categorical(y_train)))
+
+def test_get_nb_classes():
+    (_, y_train), (_, y_test) = dataset_utils.get_iris_dataset_np()
+
+    # shape: (x,) - not 1-hot
+    nb_classes_test = get_nb_classes(y_test)
+    nb_classes_train = get_nb_classes(y_train)
+    assert (nb_classes_test == nb_classes_train)
+    assert (nb_classes_test == 3)
+
+    # shape: (x,1) - not 1-hot
+    nb_classes_test = get_nb_classes(y_test.reshape(-1,1))
+    assert (nb_classes_test == 3)
+
+    # shape: (x,3) - 1-hot
+    y = to_categorical(y_test)
+    nb_classes = get_nb_classes(y)
+    assert (nb_classes == 3)
+
+    # gaps: 1,2,4 (0,3 missing)
+    y_test[y_test == 0] = 4
+    nb_classes = get_nb_classes(y_test)
+    assert (nb_classes == 5)
 

From 00f9c1686320c1c38eca2e1ea6a823988f7465bc Mon Sep 17 00:00:00 2001
From: abigailgold <57357634+abigailgold@users.noreply.github.com>
Date: Mon, 11 Jul 2022 14:28:09 +0300
Subject: [PATCH 18/26] Support additional use cases for data (#46)

* Make ART black box classifier not apply preprocessing to data
* Add option to store predictions (in addition to x,y) in Dataset and Data classes
---
 apt/utils/datasets/__init__.py |  2 +-
 apt/utils/datasets/datasets.py | 91 ++++++++++++++++++++++++++++++++--
 apt/utils/models/model.py      |  5 +-
 tests/test_datasets.py         | 41 +++++++++++++++
 tests/test_minimizer.py        | 47 ------------------
 tests/test_model.py            | 15 +++---
 6 files changed, 139 insertions(+), 62 deletions(-)
 create mode 100644 tests/test_datasets.py

diff --git a/apt/utils/datasets/__init__.py b/apt/utils/datasets/__init__.py
index 6e7c640..6252130 100644
--- a/apt/utils/datasets/__init__.py
+++ b/apt/utils/datasets/__init__.py
@@ -4,4 +4,4 @@ Implementation of datasets utility components for datasets creation, load, and s
 """
 
 from apt.utils.datasets.datasets import Dataset, StoredDataset, DatasetFactory, Data, ArrayDataset, \
-    OUTPUT_DATA_ARRAY_TYPE, DATA_PANDAS_NUMPY_TYPE
+    DatasetWithPredictions, OUTPUT_DATA_ARRAY_TYPE, DATA_PANDAS_NUMPY_TYPE
diff --git a/apt/utils/datasets/datasets.py b/apt/utils/datasets/datasets.py
index a386226..6654e5a 100644
--- a/apt/utils/datasets/datasets.py
+++ b/apt/utils/datasets/datasets.py
@@ -38,7 +38,7 @@ class Dataset(metaclass=ABCMeta):
 
         :return: the data samples
         """
-        pass
+        raise NotImplementedError
 
     @abstractmethod
     def get_labels(self) -> Collection[Any]:
@@ -47,7 +47,16 @@ class Dataset(metaclass=ABCMeta):
 
         :return: the labels
         """
-        pass
+        raise NotImplementedError
+
+    @abstractmethod
+    def get_predictions(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Get predictions
+
+        :return: predictions as numpy array
+        """
+        raise NotImplementedError
 
     def _array2numpy(self, arr: INPUT_DATA_ARRAY_TYPE) -> OUTPUT_DATA_ARRAY_TYPE:
         """
@@ -102,7 +111,7 @@ class StoredDataset(Dataset):
         :type path: string
         :return: None
         """
-        pass
+        raise NotImplementedError
 
     @abstractmethod
     def load(self, **kwargs):
@@ -111,7 +120,7 @@ class StoredDataset(Dataset):
 
         :return: None
         """
-        pass
+        raise NotImplementedError
 
     @staticmethod
     def download(url: str, dest_path: str, filename: str, unzip: Optional[bool] = False) -> None:
@@ -224,7 +233,7 @@ class ArrayDataset(Dataset):
                 raise ValueError("The supplied features are not the same as in the data features")
             self.features_names = x.columns.to_list()
 
-        if y is not None and len(self._x) != len(self._y):
+        if self._y is not None and len(self._x) != len(self._y):
             raise ValueError('Non equivalent lengths of x and y')
 
     def get_samples(self) -> OUTPUT_DATA_ARRAY_TYPE:
@@ -243,6 +252,70 @@ class ArrayDataset(Dataset):
         """
         return self._y
 
+    def get_predictions(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Get predictions
+
+        :return: predictions as numpy array
+        """
+        raise NotImplementedError
+
+
+class DatasetWithPredictions(Dataset):
+    """
+    Dataset that is based on arrays (e.g., numpy/pandas/list...). Includes predictions from a model, and possibly also
+    features and true labels.
+
+    :param x: collection of data samples
+    :type x: numpy array or pandas DataFrame or list or pytorch Tensor
+    :param y: collection of labels
+    :type y: numpy array or pandas DataFrame or list or pytorch Tensor, optional
+    :param features_names: The feature names, in the order that they appear in the data
+    :type features_names: list of strings, optional
+    """
+
+    def __init__(self, pred: INPUT_DATA_ARRAY_TYPE, x: Optional[INPUT_DATA_ARRAY_TYPE] = None,
+                 y: Optional[INPUT_DATA_ARRAY_TYPE] = None, features_names: Optional[list] = None, **kwargs):
+        self.is_pandas = False
+        self.features_names = features_names
+        self._pred = self._array2numpy(pred)
+        self._y = self._array2numpy(y) if y is not None else None
+        self._x = self._array2numpy(x) if x is not None else None
+        if self.is_pandas and x is not None:
+            if features_names and not np.array_equal(features_names, x.columns):
+                raise ValueError("The supplied features are not the same as in the data features")
+            self.features_names = x.columns.to_list()
+
+        if self._y is not None and len(self._pred) != len(self._y):
+            raise ValueError('Non equivalent lengths of pred and y')
+
+        if self._x is not None and len(self._x) != len(self._pred):
+            raise ValueError('Non equivalent lengths of x and pred')
+
+    def get_samples(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Get data samples
+
+        :return: data samples as numpy array
+        """
+        return self._x
+
+    def get_labels(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Get labels
+
+        :return: labels as numpy array
+        """
+        return self._y
+
+    def get_predictions(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Get predictions
+
+        :return: predictions as numpy array
+        """
+        return self._pred
+
 
 class PytorchData(Dataset):
     """
@@ -284,6 +357,14 @@ class PytorchData(Dataset):
         """
         return self._array2numpy(self._y) if self._y is not None else None
 
+    def get_predictions(self) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Get predictions
+
+        :return: predictions as numpy array
+        """
+        raise NotImplementedError
+
     def get_sample_item(self, idx: int) -> Tensor:
         """
         Get the sample according to the given index
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index ad5b00d..8ea837a 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -270,7 +270,8 @@ class BlackboxClassifierPredictions(BlackboxClassifier):
         self._nb_classes = get_nb_classes(y_pred)
         self._input_shape = x_pred.shape[1:]
         predict_fn = (x_pred, y_pred)
-        self._art_model = BlackBoxClassifier(predict_fn, self._input_shape, self._nb_classes, fuzzy_float_compare=True)
+        self._art_model = BlackBoxClassifier(predict_fn, self._input_shape, self._nb_classes, fuzzy_float_compare=True,
+                                             preprocessing=None)
 
 
 class BlackboxClassifierPredictFunction(BlackboxClassifier):
@@ -298,4 +299,4 @@ class BlackboxClassifierPredictFunction(BlackboxClassifier):
         super().__init__(model, output_type, black_box_access=True, unlimited_queries=unlimited_queries, **kwargs)
         self._nb_classes = nb_classes
         self._input_shape = input_shape
-        self._art_model = BlackBoxClassifier(model, self._input_shape, self._nb_classes)
+        self._art_model = BlackBoxClassifier(model, self._input_shape, self._nb_classes, preprocessing=None)
diff --git a/tests/test_datasets.py b/tests/test_datasets.py
new file mode 100644
index 0000000..4f57b0c
--- /dev/null
+++ b/tests/test_datasets.py
@@ -0,0 +1,41 @@
+import pytest
+import numpy as np
+
+from apt.utils.datasets import Data, DatasetWithPredictions
+from apt.utils import dataset_utils
+
+
+def test_dataset_predictions():
+    (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
+    pred = np.array([[0.23, 0.56, 0.21] for i in range(105)])
+
+    dataset = DatasetWithPredictions(pred)
+    data = Data(train=dataset)
+
+    new_pred = data.get_train_set().get_predictions()
+
+    assert np.equal(pred, new_pred).all()
+
+
+def test_dataset_predictions_x():
+    (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
+    pred = np.array([[0.23, 0.56, 0.21] for i in range(105)])
+
+    dataset = DatasetWithPredictions(pred, x=x_train)
+    data = Data(train=dataset)
+
+    new_pred = data.get_train_set().get_predictions()
+
+    assert np.equal(pred, new_pred).all()
+
+
+def test_dataset_predictions_y():
+    (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
+    pred = np.array([[0.23, 0.56, 0.21] for i in range(105)])
+
+    dataset = DatasetWithPredictions(pred, x=x_train, y=y_train)
+    data = Data(train=dataset)
+
+    new_pred = data.get_train_set().get_predictions()
+
+    assert np.equal(pred, new_pred).all()
diff --git a/tests/test_minimizer.py b/tests/test_minimizer.py
index 2d888bc..65d6d81 100644
--- a/tests/test_minimizer.py
+++ b/tests/test_minimizer.py
@@ -944,53 +944,6 @@ def test_keras_model():
     assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
 
 
-def test_blackbox_model():
-    (X, y), (x_test, y_test) = get_iris_dataset_np()
-    train_data = ArrayDataset(X, y)
-    test_data = ArrayDataset(x_test, y_test)
-    data = Data(train_data, test_data)
-
-    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
-    ad = ArrayDataset(x_test)
-    predictions = model.predict(ad)
-    if predictions.shape[1] > 1:
-        predictions = np.argmax(predictions, axis=1)
-    target_accuracy = 0.5
-    gen = GeneralizeToRepresentative(model, target_accuracy=target_accuracy)
-    train_dataset = ArrayDataset(x_test, predictions)
-
-    gen.fit(dataset=train_dataset)
-    transformed = gen.transform(dataset=ad)
-    gener = gen.generalizations
-    expected_generalizations = {'ranges': {'0': [], '1': [], '2': [4.849999904632568], '3': [0.7000000029802322]},
-                                'categories': {},
-                                'untouched': []}
-
-    for key in expected_generalizations['ranges']:
-        assert_almost_equal(expected_generalizations['ranges'][key], gener['ranges'][key])
-    for key in expected_generalizations['categories']:
-        assert (set([frozenset(sl) for sl in expected_generalizations['categories'][key]]) ==
-                set([frozenset(sl) for sl in gener['categories'][key]]))
-    assert (set(expected_generalizations['untouched']) == set(gener['untouched']))
-
-    features = ['0', '1', '2', '3']
-    modified_features = [f for f in features if
-                         f in expected_generalizations['categories'].keys() or f in expected_generalizations[
-                             'ranges'].keys()]
-    indexes = []
-    for i in range(len(features)):
-        if features[i] in modified_features:
-            indexes.append(i)
-    assert ((np.delete(transformed, indexes, axis=1) == np.delete(x_test, indexes, axis=1)).all())
-    ncp = gen.ncp
-    if len(expected_generalizations['ranges'].keys()) > 0 or len(expected_generalizations['categories'].keys()) > 0:
-        assert (ncp > 0)
-        assert (((transformed[indexes]) != (X[indexes])).any())
-
-    rel_accuracy = model.score(ArrayDataset(transformed, predictions))
-    assert ((rel_accuracy >= target_accuracy) or (target_accuracy - rel_accuracy) <= 0.05)
-
-
 def test_untouched():
     cells = [{"id": 1, "ranges": {"age": {"start": None, "end": 38}}, "label": 0,
               'categories': {'gender': ['male']}, "representative": {"age": 26, "height": 149}},
diff --git a/tests/test_model.py b/tests/test_model.py
index 4274a02..138c11c 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -77,7 +77,7 @@ def test_blackbox_classifier():
     assert(pred.shape[0] == x_test.shape[0])
 
     score = model.score(test)
-    assert(0.0 <= score <= 1.0)
+    assert(score == 1.0)
 
 def test_blackbox_classifier_no_test():
     (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
@@ -90,7 +90,7 @@ def test_blackbox_classifier_no_test():
     assert(pred.shape[0] == x_train.shape[0])
 
     score = model.score(train)
-    assert(0.0 <= score <= 1.0)
+    assert (score == 1.0)
 
 
 def test_blackbox_classifier_no_train():
@@ -103,7 +103,7 @@ def test_blackbox_classifier_no_train():
     assert(pred.shape[0] == x_test.shape[0])
 
     score = model.score(test)
-    assert(0.0 <= score <= 1.0)
+    assert (score == 1.0)
 
 
 def test_blackbox_classifier_no_test_y():
@@ -117,7 +117,7 @@ def test_blackbox_classifier_no_test_y():
     assert(pred.shape[0] == x_train.shape[0])
 
     score = model.score(train)
-    assert(0.0 <= score <= 1.0)
+    assert (score == 1.0)
 
     # since no test_y, BBC should use only test thus predict test should fail
     unable_to_predict_test = False
@@ -139,7 +139,7 @@ def test_blackbox_classifier_no_train_y():
     assert (pred.shape[0] == x_test.shape[0])
 
     score = model.score(test)
-    assert (0.0 <= score <= 1.0)
+    assert (score == 1.0)
 
     # since no train_y, BBC should use only test thus predict train should fail
     unable_to_predict_train = False
@@ -164,7 +164,7 @@ def test_blackbox_classifier_probabilities():
     assert (pred < 1.0).all()
 
     score = model.score(train)
-    assert (0.0 <= score <= 1.0)
+    assert (score == 1.0)
 
 
 def test_blackbox_classifier_predict():
@@ -172,6 +172,7 @@ def test_blackbox_classifier_predict():
         return [0.23, 0.56, 0.21]
 
     (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
+    y_train = np.array([[0.23, 0.56, 0.21] for i in range(105)])
 
     train = ArrayDataset(x_train, y_train)
 
@@ -182,7 +183,7 @@ def test_blackbox_classifier_predict():
     assert (pred < 1.0).all()
 
     score = model.score(train)
-    assert (0.0 <= score <= 1.0)
+    assert (score == 1.0)
 
 def test_is_one_hot():
     (_, y_train), (_, _) = dataset_utils.get_iris_dataset_np()

From bc28f7f26ae219844426dc774054826e948aa078 Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Tue, 12 Jul 2022 09:45:15 +0300
Subject: [PATCH 19/26] Return None where no predictions are available

---
 apt/utils/datasets/datasets.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/apt/utils/datasets/datasets.py b/apt/utils/datasets/datasets.py
index 6654e5a..0ebc998 100644
--- a/apt/utils/datasets/datasets.py
+++ b/apt/utils/datasets/datasets.py
@@ -258,7 +258,7 @@ class ArrayDataset(Dataset):
 
         :return: predictions as numpy array
         """
-        raise NotImplementedError
+        return None
 
 
 class DatasetWithPredictions(Dataset):
@@ -333,7 +333,7 @@ class PytorchData(Dataset):
         if self.is_pandas:
             self.features_names = x.columns
 
-        if y is not None and len(self._x) != len(self._y):
+        if self._y is not None and len(self._x) != len(self._y):
             raise ValueError('Non equivalent lengths of x and y')
 
         if self._y is not None:
@@ -363,7 +363,7 @@ class PytorchData(Dataset):
 
         :return: predictions as numpy array
         """
-        raise NotImplementedError
+        return None
 
     def get_sample_item(self, idx: int) -> Tensor:
         """

From bc7ab0cc7fad202ddafa793d1d3f7ec670d8b6cd Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Mon, 18 Jul 2022 19:27:14 +0300
Subject: [PATCH 20/26] Add model type to blackbox classifier (#49)

---
 apt/utils/models/model.py | 26 ++++++++++++++++++++++++--
 tests/test_model.py       |  2 ++
 2 files changed, 26 insertions(+), 2 deletions(-)

diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index 8ea837a..9e8379d 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -1,5 +1,5 @@
 from abc import ABCMeta, abstractmethod
-from typing import Any, Optional, Callable, Tuple
+from typing import Any, Optional, Callable, Tuple, Union
 from enum import Enum, auto
 import numpy as np
 
@@ -31,6 +31,7 @@ def get_nb_classes(y: OUTPUT_DATA_ARRAY_TYPE) -> int:
     else:
         return int(np.max(y) + 1)
 
+
 class ModelOutputType(Enum):
     CLASSIFIER_PROBABILITIES = auto()  # vector of probabilities
     CLASSIFIER_LOGITS = auto()  # vector of logits
@@ -38,6 +39,11 @@ class ModelOutputType(Enum):
     REGRESSOR_SCALAR = auto()  # value
 
 
+class ModelType(Enum):
+    SKLEARN_DECISION_TREE = auto()
+    SKLEARN_GRADIENT_BOOSTING = auto()
+
+
 class ScoringMethod(Enum):
     ACCURACY = auto()  # number of correct predictions divided by the number of samples
     MEAN_SQUARED_ERROR = auto()  # mean squared error between the predictions and true labels
@@ -157,13 +163,19 @@ class BlackboxClassifier(Model):
     :type black_box_access: boolean, optional
     :param unlimited_queries: Boolean indicating whether a user can perform unlimited queries to the model API.
     :type unlimited_queries: boolean, optional
+    :param model_type: The type of model this BlackboxClassifier represents. Needed in order to build and/or fit
+                       similar dummy/shadow models.
+    :type model_type: Either a (unfitted) model object of the underlying framework, or a ModelType representing the
+                      type of the model, optional.
     """
 
     def __init__(self, model: Any, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
-                 unlimited_queries: Optional[bool] = True, **kwargs):
+                 unlimited_queries: Optional[bool] = True, model_type: Optional[Union[Any, ModelType]] = None,
+                 **kwargs):
         super().__init__(model, output_type, black_box_access=True, unlimited_queries=unlimited_queries, **kwargs)
         self._nb_classes = None
         self._input_shape = None
+        self._model_type = model_type
 
     @property
     def nb_classes(self) -> int:
@@ -183,6 +195,16 @@ class BlackboxClassifier(Model):
         """
         return self._input_shape
 
+    @property
+    def model_type(self) -> Optional[Union[Any, ModelType]]:
+        """
+        Return the type of the model.
+
+        :return: Either a (unfitted) model object of the underlying framework, or a ModelType representing the type of
+                 the model, or None (if none provided at init).
+        """
+        return self._model_type
+
     def fit(self, train_data: Dataset, **kwargs) -> None:
         """
         A blackbox model cannot be fit.
diff --git a/tests/test_model.py b/tests/test_model.py
index 138c11c..195ad81 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -79,6 +79,8 @@ def test_blackbox_classifier():
     score = model.score(test)
     assert(score == 1.0)
 
+    assert model.model_type is None
+
 def test_blackbox_classifier_no_test():
     (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
 

From 1cc73b3da15fe6b850f82b22b6881ff61d4d678a Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Tue, 19 Jul 2022 08:43:19 +0300
Subject: [PATCH 21/26] Check for mismatch between model output type and actual
 output

---
 apt/utils/models/__init__.py      |  3 +-
 apt/utils/models/keras_model.py   |  6 ++-
 apt/utils/models/model.py         | 75 +++++++++++++++++++------------
 apt/utils/models/sklearn_model.py |  6 ++-
 tests/test_model.py               | 24 +++++++---
 5 files changed, 75 insertions(+), 39 deletions(-)

diff --git a/apt/utils/models/__init__.py b/apt/utils/models/__init__.py
index fe1721b..65861f3 100644
--- a/apt/utils/models/__init__.py
+++ b/apt/utils/models/__init__.py
@@ -1,4 +1,5 @@
 from apt.utils.models.model import Model, BlackboxClassifier, ModelOutputType, ScoringMethod, \
-    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, get_nb_classes, is_one_hot
+    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, get_nb_classes, is_one_hot, \
+    check_correct_model_output
 from apt.utils.models.sklearn_model import SklearnModel, SklearnClassifier, SklearnRegressor
 from apt.utils.models.keras_model import KerasClassifier
diff --git a/apt/utils/models/keras_model.py b/apt/utils/models/keras_model.py
index 0cb7252..6bce043 100644
--- a/apt/utils/models/keras_model.py
+++ b/apt/utils/models/keras_model.py
@@ -7,7 +7,7 @@ import tensorflow as tf
 from tensorflow import keras
 tf.compat.v1.disable_eager_execution()
 
-from apt.utils.models import Model, ModelOutputType, ScoringMethod
+from apt.utils.models import Model, ModelOutputType, ScoringMethod, check_correct_model_output
 from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
 
 from art.utils import check_and_transform_label_format
@@ -68,7 +68,9 @@ class KerasClassifier(KerasModel):
         :type x: `Dataset`
         :return: Predictions from the model as numpy array (class probabilities, if supported).
         """
-        return self._art_model.predict(x.get_samples(), **kwargs)
+        predictions = self._art_model.predict(x.get_samples(), **kwargs)
+        check_correct_model_output(predictions, self.output_type)
+        return predictions
 
     def score(self, test_data: Dataset, scoring_method: Optional[ScoringMethod] = ScoringMethod.ACCURACY, **kwargs):
         """
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index 9e8379d..902a22c 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -8,30 +8,6 @@ from art.estimators.classification import BlackBoxClassifier
 from art.utils import check_and_transform_label_format
 
 
-def is_one_hot(y: OUTPUT_DATA_ARRAY_TYPE) -> bool:
-    return len(y.shape) == 2 and y.shape[1] > 1
-
-
-def get_nb_classes(y: OUTPUT_DATA_ARRAY_TYPE) -> int:
-    """
-    Get the number of classes from an array of labels
-
-    :param y: the labels
-    :type y: numpy array
-    :return: the number of classes as integer
-    """
-    if y is None:
-        return 0
-
-    if type(y) != np.ndarray:
-        raise ValueError("Input should be numpy array")
-
-    if is_one_hot(y):
-        return y.shape[1]
-    else:
-        return int(np.max(y) + 1)
-
-
 class ModelOutputType(Enum):
     CLASSIFIER_PROBABILITIES = auto()  # vector of probabilities
     CLASSIFIER_LOGITS = auto()  # vector of logits
@@ -49,6 +25,45 @@ class ScoringMethod(Enum):
     MEAN_SQUARED_ERROR = auto()  # mean squared error between the predictions and true labels
 
 
+def is_one_hot(y: OUTPUT_DATA_ARRAY_TYPE) -> bool:
+    return len(y.shape) == 2 and y.shape[1] > 1
+
+
+def get_nb_classes(y: OUTPUT_DATA_ARRAY_TYPE) -> int:
+    """
+    Get the number of classes from an array of labels
+
+    :param y: The labels
+    :type y: numpy array
+    :return: The number of classes as integer
+    """
+    if y is None:
+        return 0
+
+    if type(y) != np.ndarray:
+        raise ValueError("Input should be numpy array")
+
+    if is_one_hot(y):
+        return y.shape[1]
+    else:
+        return int(np.max(y) + 1)
+
+
+def check_correct_model_output(y: OUTPUT_DATA_ARRAY_TYPE, output_type: ModelOutputType):
+    """
+    Checks whether there is a mismatch between the declared model output type and its actual output.
+    :param y: Model output
+    :type y: numpy array
+    :param output_type: Declared output type (provided at init)
+    :type output_type: ModelOutputType
+    :raises: ValueError (in case of mismatch)
+    """
+    if not is_one_hot(y):  # not a per-class vector: 1D array, or 2D array with a single column
+        if output_type == ModelOutputType.CLASSIFIER_PROBABILITIES or output_type == ModelOutputType.CLASSIFIER_LOGITS:
+            raise ValueError("Incompatible model output types. Model outputs 1D array of categorical scalars while "
+                             "output type is set to " + str(output_type))
+
+
 class Model(metaclass=ABCMeta):
     """
     Abstract base class for ML model wrappers.
@@ -147,8 +162,6 @@ class Model(metaclass=ABCMeta):
         return self._unlimited_queries
 
 
-
-
 class BlackboxClassifier(Model):
     """
     Wrapper for black-box ML classification models.
@@ -168,7 +181,6 @@ class BlackboxClassifier(Model):
     :type model_type: Either a (unfitted) model object of the underlying framework, or a ModelType representing the
                       type of the model, optional.
     """
-
     def __init__(self, model: Any, output_type: ModelOutputType, black_box_access: Optional[bool] = True,
                  unlimited_queries: Optional[bool] = True, model_type: Optional[Union[Any, ModelType]] = None,
                  **kwargs):
@@ -220,7 +232,9 @@ class BlackboxClassifier(Model):
         :type x: `Dataset`
         :return: Predictions from the model as numpy array.
         """
-        return self._art_model.predict(x.get_samples())
+        predictions = self._art_model.predict(x.get_samples())
+        check_correct_model_output(predictions, self.output_type)
+        return predictions
 
     def score(self, test_data: Dataset, scoring_method: Optional[ScoringMethod] = ScoringMethod.ACCURACY, **kwargs):
         """
@@ -266,6 +280,11 @@ class BlackboxClassifierPredictions(BlackboxClassifier):
         x_test_pred = model.get_test_samples()
         y_test_pred = model.get_test_labels()
 
+        if y_train_pred is not None:
+            check_correct_model_output(y_train_pred, self.output_type)
+        if y_test_pred is not None:
+            check_correct_model_output(y_test_pred, self.output_type)
+
         if y_train_pred is not None and len(y_train_pred.shape) == 1:
             self._nb_classes = get_nb_classes(y_train_pred)
             y_train_pred = check_and_transform_label_format(y_train_pred, nb_classes=self._nb_classes)
diff --git a/apt/utils/models/sklearn_model.py b/apt/utils/models/sklearn_model.py
index 8becc18..c378a24 100644
--- a/apt/utils/models/sklearn_model.py
+++ b/apt/utils/models/sklearn_model.py
@@ -3,7 +3,7 @@ from typing import Optional
 from sklearn.preprocessing import OneHotEncoder
 from sklearn.base import BaseEstimator
 
-from apt.utils.models import Model, ModelOutputType, get_nb_classes
+from apt.utils.models import Model, ModelOutputType, get_nb_classes, check_correct_model_output
 from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
 
 from art.estimators.classification.scikitlearn import SklearnClassifier as ArtSklearnClassifier
@@ -71,7 +71,9 @@ class SklearnClassifier(SklearnModel):
         :type x: `Dataset`
         :return: Predictions from the model as numpy array (class probabilities, if supported).
         """
-        return self._art_model.predict(x.get_samples(), **kwargs)
+        predictions = self._art_model.predict(x.get_samples(), **kwargs)
+        check_correct_model_output(predictions, self.output_type)
+        return predictions
 
 
 class SklearnRegressor(SklearnModel):
diff --git a/tests/test_model.py b/tests/test_model.py
index 195ad81..8b4769c 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -72,7 +72,7 @@ def test_blackbox_classifier():
     train = ArrayDataset(x_train, y_train)
     test = ArrayDataset(x_test, y_test)
     data = Data(train, test)
-    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_SCALAR)
     pred = model.predict(test)
     assert(pred.shape[0] == x_test.shape[0])
 
@@ -81,13 +81,24 @@ def test_blackbox_classifier():
 
     assert model.model_type is None
 
+
+def test_blackbox_classifier_mismatch():
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
+
+    train = ArrayDataset(x_train, y_train)
+    test = ArrayDataset(x_test, y_test)
+    data = Data(train, test)
+    with pytest.raises(ValueError):
+        model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+
+
 def test_blackbox_classifier_no_test():
     (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
 
     train = ArrayDataset(x_train, y_train)
 
     data = Data(train)
-    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_SCALAR)
     pred = model.predict(train)
     assert(pred.shape[0] == x_train.shape[0])
 
@@ -100,7 +111,7 @@ def test_blackbox_classifier_no_train():
 
     test = ArrayDataset(x_test, y_test)
     data = Data(test=test)
-    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_SCALAR)
     pred = model.predict(test)
     assert(pred.shape[0] == x_test.shape[0])
 
@@ -114,7 +125,7 @@ def test_blackbox_classifier_no_test_y():
     train = ArrayDataset(x_train, y_train)
     test = ArrayDataset(x_test)
     data = Data(train, test)
-    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_SCALAR)
     pred = model.predict(train)
     assert(pred.shape[0] == x_train.shape[0])
 
@@ -136,7 +147,7 @@ def test_blackbox_classifier_no_train_y():
     train = ArrayDataset(x_train)
     test = ArrayDataset(x_test, y_test)
     data = Data(train, test)
-    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_SCALAR)
     pred = model.predict(test)
     assert (pred.shape[0] == x_test.shape[0])
 
@@ -171,7 +182,7 @@ def test_blackbox_classifier_probabilities():
 
 def test_blackbox_classifier_predict():
     def predict(x):
-        return [0.23, 0.56, 0.21]
+        return np.array([[0.23, 0.56, 0.21] for i in range(x.shape[0])])
 
     (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
     y_train = np.array([[0.23, 0.56, 0.21] for i in range(105)])
@@ -187,6 +198,7 @@ def test_blackbox_classifier_predict():
     score = model.score(train)
     assert (score == 1.0)
 
+
 def test_is_one_hot():
     (_, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
 

From a7d156660eae6c2cf3bf2030f41caa2f16a74441 Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Wed, 20 Jul 2022 11:39:13 +0300
Subject: [PATCH 22/26] Wrap predict method in BlackBoxClassifierPredictMethod
 to avoid exception in ART when supplied method returns scalars

---
 apt/utils/models/model.py |  9 ++++++++-
 tests/test_model.py       | 18 ++++++++++++++++++
 2 files changed, 26 insertions(+), 1 deletion(-)

diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index 902a22c..e81bc89 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -340,4 +340,11 @@ class BlackboxClassifierPredictFunction(BlackboxClassifier):
         super().__init__(model, output_type, black_box_access=True, unlimited_queries=unlimited_queries, **kwargs)
         self._nb_classes = nb_classes
         self._input_shape = input_shape
-        self._art_model = BlackBoxClassifier(model, self._input_shape, self._nb_classes, preprocessing=None)
+
+        def predict_wrapper(x):
+            predictions = self.model(x)
+            if not is_one_hot(predictions):
+                predictions = check_and_transform_label_format(predictions, nb_classes=nb_classes, return_one_hot=True)
+            return predictions
+
+        self._art_model = BlackBoxClassifier(predict_wrapper, self._input_shape, self._nb_classes, preprocessing=None)
diff --git a/tests/test_model.py b/tests/test_model.py
index 8b4769c..7ad260d 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -199,6 +199,23 @@ def test_blackbox_classifier_predict():
     assert (score == 1.0)
 
 
+def test_blackbox_classifier_predict_scalar():
+    def predict(x):
+        return np.array([[1.0] for i in range(x.shape[0])])
+
+    (x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
+    y_train = np.array([[0, 1, 0] for i in range(105)])
+
+    train = ArrayDataset(x_train, y_train)
+
+    model = BlackboxClassifierPredictFunction(predict, ModelOutputType.CLASSIFIER_SCALAR, (4,), 3)
+    pred = model.predict(train)
+    assert (pred.shape[0] == x_train.shape[0])
+
+    score = model.score(train)
+    assert (score == 1.0)
+
+
 def test_is_one_hot():
     (_, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
 
@@ -206,6 +223,7 @@ def test_is_one_hot():
     assert (not is_one_hot(y_train.reshape(-1,1)))
     assert (is_one_hot(to_categorical(y_train)))
 
+
 def test_get_nb_classes():
     (_, y_train), (_, y_test) = dataset_utils.get_iris_dataset_np()
 

From 77a6e08c8e7f0c0ce5f4380a1a607a5acf0bce38 Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Wed, 20 Jul 2022 14:17:25 +0300
Subject: [PATCH 23/26] Keras regression support

---
 apt/utils/models/__init__.py    |   2 +-
 apt/utils/models/keras_model.py | 120 ++++++++++++++++----------------
 requirements.txt                |   2 +-
 tests/test_model.py             |  24 ++++++-
 4 files changed, 85 insertions(+), 63 deletions(-)

diff --git a/apt/utils/models/__init__.py b/apt/utils/models/__init__.py
index 65861f3..e458139 100644
--- a/apt/utils/models/__init__.py
+++ b/apt/utils/models/__init__.py
@@ -2,4 +2,4 @@ from apt.utils.models.model import Model, BlackboxClassifier, ModelOutputType, S
     BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, get_nb_classes, is_one_hot, \
     check_correct_model_output
 from apt.utils.models.sklearn_model import SklearnModel, SklearnClassifier, SklearnRegressor
-from apt.utils.models.keras_model import KerasClassifier
+from apt.utils.models.keras_model import KerasClassifier, KerasRegressor
diff --git a/apt/utils/models/keras_model.py b/apt/utils/models/keras_model.py
index 6bce043..2f01385 100644
--- a/apt/utils/models/keras_model.py
+++ b/apt/utils/models/keras_model.py
@@ -7,12 +7,14 @@ import tensorflow as tf
 from tensorflow import keras
 tf.compat.v1.disable_eager_execution()
 
+from sklearn.metrics import mean_squared_error
+
 from apt.utils.models import Model, ModelOutputType, ScoringMethod, check_correct_model_output
 from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
 
 from art.utils import check_and_transform_label_format
 from art.estimators.classification.keras import KerasClassifier as ArtKerasClassifier
-# from art.estimators.regression.keras import KerasRegressor as ArtKerasRegressor
+from art.estimators.regression.keras import KerasRegressor as ArtKerasRegressor
 
 
 class KerasModel(Model):
@@ -90,62 +92,60 @@ class KerasClassifier(KerasModel):
             raise NotImplementedError
 
 
-# class KerasRegressor(KerasModel):
-#     """
-#     Wrapper class for keras regression models.
-#
-#     :param model: The original keras model object.
-#     :type model: `keras.models.Model`
-#     :param black_box_access: Boolean describing the type of deployment of the model (when in production).
-#                              Set to True if the model is only available via query (API) access, i.e.,
-#                              only the outputs of the model are exposed, and False if the model internals
-#                              are also available. Default is True.
-#     :type black_box_access: boolean, optional
-#     :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
-#                               unlimited queries to the model API or whether there is a limit to the number of
-#                               queries that can be submitted. Default is True.
-#     :type unlimited_queries: boolean, optional
-#     """
-#     def __init__(self, model: keras.models.Model, black_box_access: Optional[bool] = True,
-#                  unlimited_queries: Optional[bool] = True, **kwargs):
-#         super().__init__(model, ModelOutputType.REGRESSOR_SCALAR, black_box_access, unlimited_queries, **kwargs)
-#         self._art_model = ArtKerasRegressor(model)
-#
-#     def fit(self, train_data: Dataset, **kwargs) -> None:
-#         """
-#         Fit the model using the training data.
-#
-#         :param train_data: Training data.
-#         :type train_data: `Dataset`
-#         :return: None
-#         """
-#         self._art_model.fit(train_data.get_samples(), train_data.get_labels(), **kwargs)
-#
-#     def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
-#         """
-#         Perform predictions using the model for input `x`.
-#
-#         :param x: Input samples.
-#         :type x: `Dataset`
-#         :return: Predictions from the model as numpy array.
-#         """
-#         return self._art_model.predict(x.get_samples(), **kwargs)
-#
-#     def score(self, test_data: Dataset, scoring_method: Optional[ScoringMethod] = ScoringMethod.MEAN_SQUARED_ERROR,
-#               **kwargs):
-#         """
-#         Score the model using test data.
-#
-#         :param test_data: Test data.
-#         :type train_data: `Dataset`
-#         :param scoring_method: The method for scoring predictions. Default is ACCURACY.
-#         :type scoring_method: `ScoringMethod`, optional
-#         :return: the score as float
-#         """
-#         y = check_and_transform_label_format(test_data.get_labels(), self._art_model.nb_classes)
-#         predicted = self.predict(test_data)
-#         if scoring_method == ScoringMethod.MEAN_SQUARED_ERROR:
-#             mse = keras.losses.MeanSquaredError(reduction=keras.losses.Reduction.SUM)
-#             return mse(y, predicted).numpy()
-#         else:
-#             raise NotImplementedError('Only MEAN_SQUARED_ERROR supported as scoring method')
+class KerasRegressor(KerasModel):
+    """
+    Wrapper class for keras regression models.
+
+    :param model: The original keras model object.
+    :type model: `keras.models.Model`
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Set to True if the model is only available via query (API) access, i.e.,
+                             only the outputs of the model are exposed, and False if the model internals
+                             are also available. Default is True.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                              unlimited queries to the model API or whether there is a limit to the number of
+                              queries that can be submitted. Default is True.
+    :type unlimited_queries: boolean, optional
+    """
+    def __init__(self, model: keras.models.Model, black_box_access: Optional[bool] = True,
+                 unlimited_queries: Optional[bool] = True, **kwargs):
+        super().__init__(model, ModelOutputType.REGRESSOR_SCALAR, black_box_access, unlimited_queries, **kwargs)
+        self._art_model = ArtKerasRegressor(model)
+
+    def fit(self, train_data: Dataset, **kwargs) -> None:
+        """
+        Fit the model using the training data.
+
+        :param train_data: Training data.
+        :type train_data: `Dataset`
+        :return: None
+        """
+        self._art_model.fit(train_data.get_samples(), train_data.get_labels(), **kwargs)
+
+    def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Perform predictions using the model for input `x`.
+
+        :param x: Input samples.
+        :type x: `Dataset`
+        :return: Predictions from the model as numpy array.
+        """
+        return self._art_model.predict(x.get_samples(), **kwargs)
+
+    def score(self, test_data: Dataset, scoring_method: Optional[ScoringMethod] = ScoringMethod.MEAN_SQUARED_ERROR,
+              **kwargs):
+        """
+        Score the model using test data.
+
+        :param test_data: Test data.
+        :type test_data: `Dataset`
+        :param scoring_method: The method for scoring predictions. Default is MEAN_SQUARED_ERROR.
+        :type scoring_method: `ScoringMethod`, optional
+        :return: the score as float
+        """
+        predicted = self.predict(test_data)
+        if scoring_method == ScoringMethod.MEAN_SQUARED_ERROR:
+            return mean_squared_error(test_data.get_labels(), predicted)
+        else:
+            raise NotImplementedError('Only MEAN_SQUARED_ERROR supported as scoring method')
diff --git a/requirements.txt b/requirements.txt
index 4ce8d46..849ca96 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -3,7 +3,7 @@ pandas==1.1.0
 scipy==1.4.1
 scikit-learn==0.22.2
 torch>=1.8.0
-adversarial-robustness-toolbox>=1.10.1
+adversarial-robustness-toolbox>=1.11.0
 
 # testing
 pytest==5.4.2
diff --git a/tests/test_model.py b/tests/test_model.py
index 7ad260d..d5f4216 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -1,7 +1,7 @@
 import pytest
 import numpy as np
 
-from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, \
+from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, KerasRegressor, \
     BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, is_one_hot, get_nb_classes
 from apt.utils.datasets import ArrayDataset, Data
 from apt.utils import dataset_utils
@@ -66,6 +66,28 @@ def test_keras_classifier():
     assert(0.0 <= score <= 1.0)
 
 
+def test_keras_regressor():
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_diabetes_dataset_np()
+
+    underlying_model = Sequential()
+    underlying_model.add(Input(shape=(10,)))
+    underlying_model.add(Dense(100, activation="relu"))
+    underlying_model.add(Dense(10, activation="relu"))
+    underlying_model.add(Dense(1))
+
+    underlying_model.compile(loss="mean_squared_error", optimizer="adam", metrics=["accuracy"])
+
+    model = KerasRegressor(underlying_model)
+
+    train = ArrayDataset(x_train, y_train)
+    test = ArrayDataset(x_test, y_test)
+    model.fit(train)
+    pred = model.predict(test)
+    assert (pred.shape[0] == x_test.shape[0])
+
+    score = model.score(test)
+
+
 def test_blackbox_classifier():
     (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
 

From fb534f7a0fd0d62acf5955ffd8076edabc725782 Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Sun, 24 Jul 2022 21:05:12 +0300
Subject: [PATCH 24/26] BlackboxClassifier based on predictions to work with
 DatasetWithPredictions

---
 apt/utils/datasets/datasets.py | 26 +++++++++++++++++++++++---
 apt/utils/models/model.py      | 10 ++++++++--
 tests/test_model.py            | 33 ++++++++++++++++++++++++++++++++-
 3 files changed, 63 insertions(+), 6 deletions(-)

diff --git a/apt/utils/datasets/datasets.py b/apt/utils/datasets/datasets.py
index 0ebc998..7eae95f 100644
--- a/apt/utils/datasets/datasets.py
+++ b/apt/utils/datasets/datasets.py
@@ -477,7 +477,7 @@ class Data:
 
     def get_train_samples(self) -> Collection[Any]:
         """
-        Get train set samples
+        Get train set samples, or None if no training data provided
 
         :return: training samples
         """
@@ -487,7 +487,7 @@ class Data:
 
     def get_train_labels(self) -> Collection[Any]:
         """
-        Get train set labels
+        Get train set labels, or None if no training labels provided
 
         :return: training labels
         """
@@ -495,6 +495,16 @@ class Data:
             return None
         return self.train.get_labels()
 
+    def get_train_predictions(self) -> Collection[Any]:
+        """
+        Get train set predictions, or None if no training predictions provided
+
+        :return: training predictions
+        """
+        if self.train is None:
+            return None
+        return self.train.get_predictions()
+
     def get_test_samples(self) -> Collection[Any]:
         """
         Get test set samples
@@ -509,8 +519,18 @@ class Data:
         """
         Get test set labels
 
-        :return: test labels, or None if no test data provided
+        :return: test labels, or None if no test labels provided
         """
         if self.test is None:
             return None
         return self.test.get_labels()
+
+    def get_test_predictions(self) -> Collection[Any]:
+        """
+        Get test set predictions, or None if no test predictions provided
+
+        :return: test predictions
+        """
+        if self.test is None:
+            return None
+        return self.test.get_predictions()
diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index e81bc89..d9811e1 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -246,6 +246,8 @@ class BlackboxClassifier(Model):
         :type scoring_method: `ScoringMethod`, optional
         :return: the score as float (for classifiers, between 0 and 1)
         """
+        if test_data.get_samples() is None or test_data.get_labels() is None:
+            raise ValueError('score can only be computed when test data and labels are available')
         predicted = self._art_model.predict(test_data.get_samples())
         y = check_and_transform_label_format(test_data.get_labels(), nb_classes=self._nb_classes)
         if scoring_method == ScoringMethod.ACCURACY:
@@ -276,9 +278,13 @@ class BlackboxClassifierPredictions(BlackboxClassifier):
                  unlimited_queries: Optional[bool] = True, **kwargs):
         super().__init__(model, output_type, black_box_access=True, unlimited_queries=False, **kwargs)
         x_train_pred = model.get_train_samples()
-        y_train_pred = model.get_train_labels()
+        y_train_pred = model.get_train_predictions()
+        if y_train_pred is None:
+            y_train_pred = model.get_train_labels()
         x_test_pred = model.get_test_samples()
-        y_test_pred = model.get_test_labels()
+        y_test_pred = model.get_test_predictions()
+        if y_test_pred is None:
+            y_test_pred = model.get_test_labels()
 
         if y_train_pred is not None:
             check_correct_model_output(y_train_pred, self.output_type)
diff --git a/tests/test_model.py b/tests/test_model.py
index d5f4216..821c776 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -3,7 +3,7 @@ import numpy as np
 
 from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, KerasRegressor, \
     BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, is_one_hot, get_nb_classes
-from apt.utils.datasets import ArrayDataset, Data
+from apt.utils.datasets import ArrayDataset, Data, DatasetWithPredictions
 from apt.utils import dataset_utils
 
 from sklearn.tree import DecisionTreeRegressor
@@ -104,6 +104,37 @@ def test_blackbox_classifier():
     assert model.model_type is None
 
 
+def test_blackbox_classifier_predictions():
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
+
+    train = DatasetWithPredictions(y_train, x_train)
+    test = DatasetWithPredictions(y_test, x_test)
+    data = Data(train, test)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_SCALAR)
+    pred = model.predict(test)
+    assert(pred.shape[0] == x_test.shape[0])
+    assert model.model_type is None
+
+    with pytest.raises(ValueError):
+        model.score(test)
+
+
+def test_blackbox_classifier_predictions_y():
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
+
+    train = DatasetWithPredictions(y_train, x_train, y_train)
+    test = DatasetWithPredictions(y_test, x_test, y_test)
+    data = Data(train, test)
+    model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_SCALAR)
+    pred = model.predict(test)
+    assert(pred.shape[0] == x_test.shape[0])
+
+    score = model.score(test)
+    assert(score == 1.0)
+
+    assert model.model_type is None
+
+
 def test_blackbox_classifier_mismatch():
     (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
 

From a13415ad67af786b2d38c991020a9eb401febbb9 Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Mon, 25 Jul 2022 15:47:04 +0300
Subject: [PATCH 25/26] Externalize BlackboxClassifier dataset (x and
 predictions)

---
 apt/utils/models/model.py | 10 ++++++++++
 tests/test_model.py       | 10 ++++++++++
 2 files changed, 20 insertions(+)

diff --git a/apt/utils/models/model.py b/apt/utils/models/model.py
index d9811e1..06cae10 100644
--- a/apt/utils/models/model.py
+++ b/apt/utils/models/model.py
@@ -316,10 +316,20 @@ class BlackboxClassifierPredictions(BlackboxClassifier):
 
         self._nb_classes = get_nb_classes(y_pred)
         self._input_shape = x_pred.shape[1:]
+        self._x_pred = x_pred
+        self._y_pred = y_pred
         predict_fn = (x_pred, y_pred)
         self._art_model = BlackBoxClassifier(predict_fn, self._input_shape, self._nb_classes, fuzzy_float_compare=True,
                                              preprocessing=None)
 
+    def get_predictions(self) -> Tuple[OUTPUT_DATA_ARRAY_TYPE, OUTPUT_DATA_ARRAY_TYPE]:
+        """
+        Return all the data for which the model contains predictions.
+
+        :return: Tuple containing data and predictions as numpy arrays.
+        """
+        return self._x_pred, self._y_pred
+
 
 class BlackboxClassifierPredictFunction(BlackboxClassifier):
     """
diff --git a/tests/test_model.py b/tests/test_model.py
index 821c776..21c8fff 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -12,6 +12,8 @@ from sklearn.ensemble import RandomForestClassifier
 from tensorflow.keras.models import Sequential
 from tensorflow.keras.layers import Dense, Input
 
+from art.utils import check_and_transform_label_format
+
 
 from art.utils import to_categorical
 
@@ -158,6 +160,10 @@ def test_blackbox_classifier_no_test():
     score = model.score(train)
     assert (score == 1.0)
 
+    predictions_x, predictions_y = model.get_predictions()
+    assert np.array_equal(predictions_x, x_train)
+    assert np.array_equal(predictions_y, check_and_transform_label_format(y_train, nb_classes=3))
+
 
 def test_blackbox_classifier_no_train():
     (_, _), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
@@ -171,6 +177,10 @@ def test_blackbox_classifier_no_train():
     score = model.score(test)
     assert (score == 1.0)
 
+    predictions_x, predictions_y = model.get_predictions()
+    assert np.array_equal(predictions_x, x_test)
+    assert np.array_equal(predictions_y, check_and_transform_label_format(y_test, nb_classes=3))
+
 
 def test_blackbox_classifier_no_test_y():
     (x_train, y_train), (x_test, _) = dataset_utils.get_iris_dataset_np()

From a9e2a35e18d9e01cc6cd223b8e27f40025012c9e Mon Sep 17 00:00:00 2001
From: abigailt <abigailt@il.ibm.com>
Date: Thu, 28 Jul 2022 16:31:08 +0300
Subject: [PATCH 26/26] Add support for xgboost XGBClassifier (#53)

---
 apt/utils/models/__init__.py      |  1 +
 apt/utils/models/xgboost_model.py | 87 +++++++++++++++++++++++++++++++
 tests/test_model.py               | 19 ++++++-
 3 files changed, 106 insertions(+), 1 deletion(-)
 create mode 100644 apt/utils/models/xgboost_model.py

diff --git a/apt/utils/models/__init__.py b/apt/utils/models/__init__.py
index e458139..ff582b4 100644
--- a/apt/utils/models/__init__.py
+++ b/apt/utils/models/__init__.py
@@ -3,3 +3,4 @@ from apt.utils.models.model import Model, BlackboxClassifier, ModelOutputType, S
     check_correct_model_output
 from apt.utils.models.sklearn_model import SklearnModel, SklearnClassifier, SklearnRegressor
 from apt.utils.models.keras_model import KerasClassifier, KerasRegressor
+from apt.utils.models.xgboost_model import XGBoostClassifier
diff --git a/apt/utils/models/xgboost_model.py b/apt/utils/models/xgboost_model.py
new file mode 100644
index 0000000..1ea02e7
--- /dev/null
+++ b/apt/utils/models/xgboost_model.py
@@ -0,0 +1,87 @@
+from typing import Optional, Tuple
+
+from apt.utils.models import Model, ModelOutputType, ScoringMethod, check_correct_model_output, is_one_hot
+from apt.utils.datasets import Dataset, OUTPUT_DATA_ARRAY_TYPE
+
+from xgboost import XGBClassifier
+import numpy as np
+
+from art.estimators.classification.xgboost import XGBoostClassifier as ArtXGBoostClassifier
+
+
+class XGBoostModel(Model):
+    """
+    Base wrapper class for xgboost models; it adds nothing to `Model` itself and is extended by `XGBoostClassifier`.
+    """
+
+
+class XGBoostClassifier(XGBoostModel):
+    """
+    Wrapper class for xgboost classification models, backed by ART's XGBoostClassifier estimator.
+
+    :param model: The original xgboost model object. Must be fit.
+    :type model: Booster or XGBClassifier object
+    :param output_type: The type of output the model yields (vector/label only)
+    :type output_type: `ModelOutputType`
+    :param input_shape: Shape of input to the model. Its first entry is used as the number of features.
+    :type input_shape: Tuple[int, ...]
+    :param nb_classes: Number of prediction classes of the model.
+    :type nb_classes: int
+    :param black_box_access: Boolean describing the type of deployment of the model (when in production).
+                             Set to True if the model is only available via query (API) access, i.e.,
+                             only the outputs of the model are exposed, and False if the model internals
+                             are also available. Default is True.
+    :type black_box_access: boolean, optional
+    :param unlimited_queries: If black_box_access is True, this boolean indicates whether a user can perform
+                              unlimited queries to the model API or whether there is a limit to the number of
+                              queries that can be submitted. Default is True.
+    :type unlimited_queries: boolean, optional
+    """
+    def __init__(self, model: XGBClassifier, output_type: ModelOutputType, input_shape: Tuple[int, ...],
+                 nb_classes: int, black_box_access: Optional[bool] = True,
+                 unlimited_queries: Optional[bool] = True, **kwargs):
+        super().__init__(model, output_type, black_box_access, unlimited_queries, **kwargs)
+        self._art_model = ArtXGBoostClassifier(model, nb_features=input_shape[0], nb_classes=nb_classes)
+        self.nb_classes = nb_classes
+
+    def fit(self, train_data: Dataset, **kwargs) -> None:
+        """
+        Fit the model using the training data. Extra keyword arguments are forwarded to the underlying model's `fit`.
+
+        :param train_data: Training data. Labels are expected to either be one-hot encoded or a 1D-array of categorical
+                           labels (consecutive integers starting at 0).
+        :type train_data: `Dataset`
+        :return: None
+        """
+        self._art_model._model.fit(train_data.get_samples(), train_data.get_labels(), **kwargs)
+
+    def predict(self, x: Dataset, **kwargs) -> OUTPUT_DATA_ARRAY_TYPE:
+        """
+        Perform predictions using the model for input `x`. Extra keyword arguments are forwarded to the ART estimator.
+
+        :param x: Input samples.
+        :type x: `Dataset`
+        :return: Predictions from the model as numpy array (class probabilities, if supported).
+        """
+        predictions = self._art_model.predict(x.get_samples(), **kwargs)
+        check_correct_model_output(predictions, self.output_type)
+        return predictions
+
+    def score(self, test_data: Dataset, scoring_method: Optional[ScoringMethod] = ScoringMethod.ACCURACY, **kwargs):
+        """
+        Score the model on test data. Only `ScoringMethod.ACCURACY` is implemented (others raise NotImplementedError).
+
+        :param test_data: Test data.
+        :type test_data: `Dataset`
+        :return: the score as float (for classifiers, between 0 and 1)
+        """
+        y = test_data.get_labels()
+        predicted = self.predict(test_data)
+        if is_one_hot(predicted):
+            predicted = np.argmax(predicted, axis=1)
+        if is_one_hot(y):
+            y = np.argmax(y, axis=1)
+        if scoring_method == ScoringMethod.ACCURACY:
+            return np.count_nonzero(y == predicted) / predicted.shape[0]
+        else:
+            raise NotImplementedError
diff --git a/tests/test_model.py b/tests/test_model.py
index 21c8fff..c182c59 100644
--- a/tests/test_model.py
+++ b/tests/test_model.py
@@ -2,12 +2,13 @@ import pytest
 import numpy as np
 
 from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, KerasRegressor, \
-    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, is_one_hot, get_nb_classes
+    BlackboxClassifierPredictions, BlackboxClassifierPredictFunction, is_one_hot, get_nb_classes, XGBoostClassifier
 from apt.utils.datasets import ArrayDataset, Data, DatasetWithPredictions
 from apt.utils import dataset_utils
 
 from sklearn.tree import DecisionTreeRegressor
 from sklearn.ensemble import RandomForestClassifier
+from xgboost import XGBClassifier
 
 from tensorflow.keras.models import Sequential
 from tensorflow.keras.layers import Dense, Input
@@ -90,6 +91,22 @@ def test_keras_regressor():
     score = model.score(test)
 
 
+def test_xgboost_classifier():
+    """Exercise predict, score and fit of the XGBoostClassifier wrapper on the iris dataset."""
+    (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
+    fitted_xgb = XGBClassifier()
+    fitted_xgb.fit(x_train, y_train)
+    wrapper = XGBoostClassifier(fitted_xgb, ModelOutputType.CLASSIFIER_PROBABILITIES, input_shape=(4,), nb_classes=3)
+    test_set = ArrayDataset(x_test, y_test)
+    predictions = wrapper.predict(test_set)
+    assert predictions.shape[0] == x_test.shape[0]
+
+    accuracy = wrapper.score(test_set)
+    assert 0.0 <= accuracy <= 1.0
+    # Refit through the wrapper; the underlying model was already fitted above.
+    wrapper.fit(ArrayDataset(x_train, y_train))
+
+
 def test_blackbox_classifier():
     (x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()