2022-04-27 12:33:27 +03:00
|
|
|
import pytest
|
2022-06-30 18:23:53 +03:00
|
|
|
import numpy as np
|
2022-04-27 12:33:27 +03:00
|
|
|
|
2022-06-30 18:23:53 +03:00
|
|
|
from apt.utils.models import SklearnClassifier, SklearnRegressor, ModelOutputType, KerasClassifier, \
|
|
|
|
|
BlackboxClassifierPredictions, BlackboxClassifierPredictFunction
|
2022-05-12 15:44:29 +03:00
|
|
|
from apt.utils.datasets import ArrayDataset, Data
|
2022-04-27 12:33:27 +03:00
|
|
|
from apt.utils import dataset_utils
|
|
|
|
|
|
|
|
|
|
from sklearn.tree import DecisionTreeRegressor
|
|
|
|
|
from sklearn.ensemble import RandomForestClassifier
|
|
|
|
|
|
2022-05-12 15:44:29 +03:00
|
|
|
from tensorflow.keras.models import Sequential
|
|
|
|
|
from tensorflow.keras.layers import Dense, Input
|
|
|
|
|
|
2022-04-27 12:33:27 +03:00
|
|
|
|
|
|
|
|
def test_sklearn_classifier():
|
2022-05-12 15:44:29 +03:00
|
|
|
(x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
|
2022-04-27 12:33:27 +03:00
|
|
|
underlying_model = RandomForestClassifier()
|
2022-05-12 15:44:29 +03:00
|
|
|
model = SklearnClassifier(underlying_model, ModelOutputType.CLASSIFIER_PROBABILITIES)
|
2022-04-27 12:33:27 +03:00
|
|
|
train = ArrayDataset(x_train, y_train)
|
|
|
|
|
test = ArrayDataset(x_test, y_test)
|
|
|
|
|
model.fit(train)
|
2022-05-12 15:44:29 +03:00
|
|
|
pred = model.predict(test)
|
2022-04-27 12:33:27 +03:00
|
|
|
assert(pred.shape[0] == x_test.shape[0])
|
|
|
|
|
|
|
|
|
|
score = model.score(test)
|
|
|
|
|
assert(0.0 <= score <= 1.0)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def test_sklearn_regressor():
|
2022-05-12 15:44:29 +03:00
|
|
|
(x_train, y_train), (x_test, y_test) = dataset_utils.get_diabetes_dataset_np()
|
2022-04-27 12:33:27 +03:00
|
|
|
underlying_model = DecisionTreeRegressor()
|
|
|
|
|
model = SklearnRegressor(underlying_model)
|
|
|
|
|
train = ArrayDataset(x_train, y_train)
|
|
|
|
|
test = ArrayDataset(x_test, y_test)
|
|
|
|
|
model.fit(train)
|
2022-05-12 15:44:29 +03:00
|
|
|
pred = model.predict(test)
|
2022-04-27 12:33:27 +03:00
|
|
|
assert (pred.shape[0] == x_test.shape[0])
|
|
|
|
|
|
|
|
|
|
score = model.score(test)
|
2022-05-12 15:44:29 +03:00
|
|
|
|
|
|
|
|
|
|
|
|
|
def test_keras_classifier():
|
|
|
|
|
(x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
|
|
|
|
|
|
|
|
|
|
underlying_model = Sequential()
|
|
|
|
|
underlying_model.add(Input(shape=(4,)))
|
|
|
|
|
underlying_model.add(Dense(100, activation="relu"))
|
|
|
|
|
underlying_model.add(Dense(10, activation="relu"))
|
|
|
|
|
underlying_model.add(Dense(3, activation='softmax'))
|
|
|
|
|
|
|
|
|
|
underlying_model.compile(loss="categorical_crossentropy", optimizer="adam", metrics=["accuracy"])
|
|
|
|
|
|
|
|
|
|
model = KerasClassifier(underlying_model, ModelOutputType.CLASSIFIER_PROBABILITIES)
|
|
|
|
|
|
|
|
|
|
train = ArrayDataset(x_train, y_train)
|
|
|
|
|
test = ArrayDataset(x_test, y_test)
|
|
|
|
|
model.fit(train)
|
|
|
|
|
pred = model.predict(test)
|
|
|
|
|
assert(pred.shape[0] == x_test.shape[0])
|
|
|
|
|
|
|
|
|
|
score = model.score(test)
|
|
|
|
|
assert(0.0 <= score <= 1.0)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def test_blackbox_classifier():
|
|
|
|
|
(x_train, y_train), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
|
|
|
|
|
|
|
|
|
|
train = ArrayDataset(x_train, y_train)
|
|
|
|
|
test = ArrayDataset(x_test, y_test)
|
|
|
|
|
data = Data(train, test)
|
2022-06-30 18:23:53 +03:00
|
|
|
model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
|
2022-05-12 15:44:29 +03:00
|
|
|
pred = model.predict(test)
|
|
|
|
|
assert(pred.shape[0] == x_test.shape[0])
|
|
|
|
|
|
|
|
|
|
score = model.score(test)
|
|
|
|
|
assert(0.0 <= score <= 1.0)
|
2022-06-26 14:43:22 +03:00
|
|
|
|
|
|
|
|
def test_blackbox_classifier_no_test():
|
|
|
|
|
(x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
|
|
|
|
|
|
|
|
|
|
train = ArrayDataset(x_train, y_train)
|
|
|
|
|
|
|
|
|
|
data = Data(train)
|
2022-06-30 18:23:53 +03:00
|
|
|
model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
|
2022-06-26 14:43:22 +03:00
|
|
|
pred = model.predict(train)
|
|
|
|
|
assert(pred.shape[0] == x_train.shape[0])
|
|
|
|
|
|
|
|
|
|
score = model.score(train)
|
|
|
|
|
assert(0.0 <= score <= 1.0)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def test_blackbox_classifier_no_train():
|
|
|
|
|
(_, _), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
|
|
|
|
|
|
|
|
|
|
test = ArrayDataset(x_test, y_test)
|
|
|
|
|
data = Data(test=test)
|
2022-06-30 18:23:53 +03:00
|
|
|
model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
|
2022-06-26 14:43:22 +03:00
|
|
|
pred = model.predict(test)
|
|
|
|
|
assert(pred.shape[0] == x_test.shape[0])
|
|
|
|
|
|
|
|
|
|
score = model.score(test)
|
|
|
|
|
assert(0.0 <= score <= 1.0)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def test_blackbox_classifier_no_test_y():
|
|
|
|
|
(x_train, y_train), (x_test, _) = dataset_utils.get_iris_dataset_np()
|
|
|
|
|
|
|
|
|
|
train = ArrayDataset(x_train, y_train)
|
|
|
|
|
test = ArrayDataset(x_test)
|
|
|
|
|
data = Data(train, test)
|
2022-06-30 18:23:53 +03:00
|
|
|
model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
|
2022-06-26 14:43:22 +03:00
|
|
|
pred = model.predict(train)
|
|
|
|
|
assert(pred.shape[0] == x_train.shape[0])
|
|
|
|
|
|
|
|
|
|
score = model.score(train)
|
|
|
|
|
assert(0.0 <= score <= 1.0)
|
|
|
|
|
|
|
|
|
|
# since no test_y, BBC should use only test thus predict test should fail
|
|
|
|
|
unable_to_predict_test = False
|
|
|
|
|
try:
|
|
|
|
|
model.predict(test)
|
|
|
|
|
except BaseException:
|
|
|
|
|
unable_to_predict_test = True
|
|
|
|
|
|
|
|
|
|
assert (unable_to_predict_test, True)
|
|
|
|
|
|
|
|
|
|
def test_blackbox_classifier_no_train_y():
|
|
|
|
|
(x_train, _), (x_test, y_test) = dataset_utils.get_iris_dataset_np()
|
|
|
|
|
|
|
|
|
|
train = ArrayDataset(x_train)
|
|
|
|
|
test = ArrayDataset(x_test, y_test)
|
|
|
|
|
data = Data(train, test)
|
2022-06-30 18:23:53 +03:00
|
|
|
model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
|
2022-06-26 14:43:22 +03:00
|
|
|
pred = model.predict(test)
|
|
|
|
|
assert (pred.shape[0] == x_test.shape[0])
|
|
|
|
|
|
|
|
|
|
score = model.score(test)
|
|
|
|
|
assert (0.0 <= score <= 1.0)
|
|
|
|
|
|
|
|
|
|
# since no train_y, BBC should use only test thus predict train should fail
|
|
|
|
|
unable_to_predict_train = False
|
|
|
|
|
try:
|
|
|
|
|
model.predict(train)
|
|
|
|
|
except BaseException:
|
|
|
|
|
unable_to_predict_train = True
|
|
|
|
|
|
|
|
|
|
assert(unable_to_predict_train,True)
|
|
|
|
|
|
2022-06-30 18:23:53 +03:00
|
|
|
def test_blackbox_classifier_probabilities():
|
|
|
|
|
(x_train, _), (_, _) = dataset_utils.get_iris_dataset_np()
|
|
|
|
|
y_train = np.array([[0.23, 0.56, 0.21] for i in range(105)])
|
|
|
|
|
|
|
|
|
|
train = ArrayDataset(x_train, y_train)
|
|
|
|
|
|
|
|
|
|
data = Data(train)
|
|
|
|
|
model = BlackboxClassifierPredictions(data, ModelOutputType.CLASSIFIER_PROBABILITIES)
|
|
|
|
|
pred = model.predict(train)
|
|
|
|
|
assert (pred.shape[0] == x_train.shape[0])
|
|
|
|
|
assert (0.0 < pred).all()
|
|
|
|
|
assert (pred < 1.0).all()
|
|
|
|
|
|
|
|
|
|
score = model.score(train)
|
|
|
|
|
assert (0.0 <= score <= 1.0)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def test_blackbox_classifier_predict():
|
|
|
|
|
def predict(x):
|
|
|
|
|
return [0.23, 0.56, 0.21]
|
|
|
|
|
|
|
|
|
|
(x_train, y_train), (_, _) = dataset_utils.get_iris_dataset_np()
|
|
|
|
|
|
|
|
|
|
train = ArrayDataset(x_train, y_train)
|
|
|
|
|
|
|
|
|
|
model = BlackboxClassifierPredictFunction(predict, ModelOutputType.CLASSIFIER_PROBABILITIES, (4,), 3)
|
|
|
|
|
pred = model.predict(train)
|
|
|
|
|
assert (pred.shape[0] == x_train.shape[0])
|
|
|
|
|
assert (0.0 < pred).all()
|
|
|
|
|
assert (pred < 1.0).all()
|
|
|
|
|
|
|
|
|
|
score = model.score(train)
|
|
|
|
|
assert (0.0 <= score <= 1.0)
|
|
|
|
|
|
|
|
|
|
|