GPy/GPy/testing/test_plotting.py
2023-10-16 08:30:53 +02:00

703 lines
24 KiB
Python

# ===============================================================================
# Copyright (c) 2015, Max Zwiessele
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are met:
#
# * Redistributions of source code must retain the above copyright notice, this
# list of conditions and the following disclaimer.
#
# * Redistributions in binary form must reproduce the above copyright notice,
# this list of conditions and the following disclaimer in the documentation
# and/or other materials provided with the distribution.
#
# * Neither the name of GPy nor the names of its
# contributors may be used to endorse or promote products derived from
# this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
# ===============================================================================
# ===============================================================================
# SKIPPING PLOTTING BECAUSE IT BEHAVES DIFFERENTLY ON DIFFERENT
# SYSTEMS, AND WILL MISBEHAVE
# raise SkipTest("Skipping Matplotlib testing")
# ===============================================================================
try:
import matplotlib
from matplotlib import pyplot as plt
from matplotlib.testing.compare import compare_images
matplotlib.use("agg")
except ImportError:
# matplotlib not installed
matplotlib = None
import pytest
import numpy as np
import GPy, os
import logging
from GPy.util.config import config
from GPy.plotting import change_plotting_library, plotting_library
class TestConfig:
    """Checks for switching the plotting library via ``change_plotting_library``."""

    def teardown(self):
        """Switch the plotting library back to matplotlib."""
        change_plotting_library("matplotlib")

    @pytest.mark.skipif(matplotlib is None, reason="Matplotlib not installed")
    def test_change_plotting(self):
        """Unknown library names are rejected and "none" disables plotting.

        Expects ``ValueError`` for an unknown library name and ``RuntimeError``
        from ``plotting_library()`` once the library was switched to "none".
        """
        try:
            with pytest.raises(ValueError):
                change_plotting_library("not+in9names")
            change_plotting_library("none")
            with pytest.raises(RuntimeError):
                plotting_library()
        finally:
            # Restore matplotlib even when one of the expectations above fails,
            # so a failure here cannot leave the library set to "none" for the
            # tests that run afterwards.
            self.teardown()
# Switch the plotting library to matplotlib for everything defined below.
change_plotting_library("matplotlib")
# File extensions the test functions in this module pass to _image_comparison.
extensions = ["npz"]
# Directory of this test module, expressed relative to the current working
# directory (abspath -> relpath -> dirname).
basedir = os.path.dirname(os.path.relpath(os.path.abspath(__file__)))
def _image_directories():
    """
    Compute the baseline and result image directories used by this module.

    Both paths live below ``basedir``. The result directory is created when it
    does not exist yet; the baseline directory is only computed, never created.

    :returns: tuple ``(baseline_dir, result_dir)``
    """
    result_dir = os.path.join(basedir, "testresult", ".")
    baseline_dir = os.path.join(basedir, "baseline", ".")
    # exist_ok=True replaces the separate exists() check, which could race
    # with another process creating the same directory.
    os.makedirs(result_dir, exist_ok=True)
    return baseline_dir, result_dir
# Resolve both image directories once, at import time.
baseline_dir, result_dir = _image_directories()
# A missing baseline directory is recorded as None; the skipif markers in this
# module test ``baseline_dir is None``.
baseline_dir = baseline_dir if os.path.exists(baseline_dir) else None
def _save_figure(fig, path):
    """Save *fig* to *path* with a transparent background and no edge/face colour."""
    fig.savefig(path, transparent=True, edgecolor="none", facecolor="none")


def _make_npz_test(base, actual, expected, rtol, kwargs):
    """Build a callable that compares the arrays stored in two ``.npz`` files.

    The arguments are bound here (instead of being read from the enclosing
    loop) so every returned callable keeps its own paths.
    """

    def do_test():
        if not os.path.exists(expected):
            import shutil

            # No baseline yet: promote the fresh result to baseline, but still
            # raise so the missing baseline does not go unnoticed.
            shutil.copy2(actual, expected)
            raise IOError(
                "Baseline file {} not found, copying result {}".format(
                    expected, actual
                )
            )
        # Load everything up front so both archives are closed again before
        # the comparison starts.
        with np.load(expected) as exp_file, np.load(actual) as act_file:
            exp_dict = dict(exp_file.items())
            act_dict = dict(act_file.items())
        for name in act_dict:
            # Arrays without a counterpart in the baseline are not compared.
            if name not in exp_dict:
                continue
            try:
                np.testing.assert_allclose(
                    exp_dict[name],
                    act_dict[name],
                    err_msg="Mismatch in {}.{}".format(base, name),
                    rtol=rtol,
                    **kwargs
                )
            except AssertionError as e:
                # pytest.skip is a function (not a context manager): report the
                # mismatch as a skipped test instead of silently dropping it.
                pytest.skip(str(e))

    return do_test


def _make_image_test(actual, expected, tol):
    """Build a callable that compares two image files with ``compare_images``."""

    def do_test():
        err = compare_images(expected, actual, tol, in_decorator=True)
        if err:
            # Differences are only reported, they do not fail the check.
            print(
                "Error between {} and {} is {:.5f}, which is bigger then the tolerance of {:.5f}".format(
                    actual, expected, err["rms"], tol
                )
            )

    return do_test


def _image_comparison(
    baseline_images, extensions=("pdf", "svg", "png"), tol=11, rtol=1e-3, **kwargs
):
    """Save all open figures and yield one comparison callable per file.

    The open pyplot figures are paired, in ``plt.get_fignums()`` order, with
    the names in *baseline_images*. Every figure is first written to
    ``result_dir`` once per extension; afterwards one zero-argument callable is
    yielded per (figure, extension) pair which compares the written file with
    the file of the same name in ``baseline_dir``.

    :param baseline_images: file name stems, one per open figure
    :param extensions: extensions to write and compare; ``"npz"`` stores the
        arrays found by ``flatten_axis`` (plus a ``png`` for inspection), any
        other extension is written with ``savefig``
    :param tol: tolerance handed to ``compare_images`` (non-npz extensions)
    :param rtol: relative tolerance handed to ``np.testing.assert_allclose``
    :param kwargs: further keyword arguments for ``np.testing.assert_allclose``
    :returns: generator of callables; all figures are closed once the
        generator finishes or is closed
    """
    extensions = tuple(extensions)
    figures = list(zip(plt.get_fignums(), baseline_images))

    # Pass 1: write every figure to the result directory.
    for num, base in figures:
        fig = plt.figure(num)
        try:
            fig.canvas.draw()
        except Exception:
            # Best effort: a figure that cannot be drawn is logged and the
            # save below is still attempted.
            logging.error(base)
        for ext in extensions:
            target = os.path.join(result_dir, "{}.{}".format(base, ext))
            if ext == "npz":
                np.savez_compressed(target, **flatten_axis(fig))
                try:
                    _save_figure(
                        fig, os.path.join(result_dir, "{}.{}".format(base, "png"))
                    )
                except Exception:
                    logging.error(base)
            else:
                _save_figure(fig, target)

    # Pass 2: hand out the comparison callables.
    try:
        for num, base in figures:
            for ext in extensions:
                actual = os.path.join(result_dir, "{}.{}".format(base, ext))
                expected = os.path.join(baseline_dir, "{}.{}".format(base, ext))
                if ext == "npz":
                    yield _make_npz_test(base, actual, expected, rtol, kwargs)
                else:
                    yield _make_image_test(actual, expected, tol)
    finally:
        # Also runs when the consumer stops iterating early.
        plt.close("all")
def flatten_axis(ax, prevname=""):
    """Collect the numpy arrays reachable from the members of *ax*.

    Every member reported by ``inspect.getmembers`` is inspected: arrays are
    stored directly, non-empty lists are searched element by element. List
    elements may themselves be arrays, dicts, lists or arbitrary objects (the
    latter are flattened recursively through this function).

    :param ax: object to inspect
    :param prevname: prefix prepended to every key of the result
    :returns: dict mapping a dotted/indexed name (e.g. ``"lines[0].attr"``)
        to the array found under that name
    """
    import inspect

    arrays = {}

    def _flatten(value, prefix):
        """Return the arrays found in *value*, keyed by names starting with *prefix*."""
        found = {}
        if isinstance(value, np.ndarray):
            # Empty arrays nested inside lists are not recorded.
            if value.size:
                found[prefix] = np.asarray(value)
        elif isinstance(value, dict):
            for key, item in value.items():
                # Recurse into the dict *values*; format() keeps this working
                # for keys that are not strings.
                found.update(_flatten(item, "{}.{}".format(prefix, key)))
        elif isinstance(value, list) and len(value) > 0:
            for index, item in enumerate(value):
                found.update(_flatten(item, "{}[{}]".format(prefix, index)))
        else:
            # Anything else is treated as an object and searched via its members.
            return flatten_axis(value, prefix + ".")
        return found

    for name, member in inspect.getmembers(ax):
        if isinstance(member, np.ndarray):
            arrays[prevname + name] = np.asarray(member)
        elif isinstance(member, list) and len(member) > 0:
            for index, item in enumerate(member):
                arrays.update(
                    _flatten(item, "{}{}[{}]".format(prevname, name, index))
                )
    return arrays
def _a(x, y, decimal):
    """Assert that *x* and *y* agree to *decimal* places (numpy semantics)."""
    np.testing.assert_array_almost_equal(x, y, decimal)


def compare_axis_dicts(x, y, decimal=6):
    """Compare two dicts of arrays and print the first difference found.

    The dicts must have the same number of entries and every array in *x* must
    match the array stored under the same key in *y* to *decimal* places. A
    violation is printed, not raised.

    :param x: dict of arrays
    :param y: dict of arrays, looked up by the keys of *x*
    :param decimal: precision handed to ``np.testing.assert_array_almost_equal``
    :raises KeyError: if a key of *x* is missing in *y*
    """
    try:
        if len(x) != len(y):
            raise AssertionError(
                "Dictionaries differ in size: {} != {}".format(len(x), len(y))
            )
        for name in x:
            _a(x[name], y[name], decimal)
    except AssertionError as e:
        # Exceptions have no ``.message`` attribute on Python 3; print the
        # exception itself.
        print(e)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_figure():
    """Draw four figures with the low-level plotting-library calls and compare them.

    The figures are an interactive image, an annotated heatmap (drawn twice on
    the same canvas), a gradient fill and a 3d line plot.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import warnings
    from GPy.plotting import plotting_library as active_library

    np.random.seed(1239847)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    with warnings.catch_warnings():
        warnings.simplefilter("ignore")

        # Figure 1: interactive image of the first input column on a 3x3 grid.
        def _first_column_grid(points):
            return points[:, 0].reshape(3, 3)

        canvas, _ = active_library().new_canvas(num="imshow_interact")
        active_library().imshow_interact(
            canvas, _first_column_grid, extent=(-1, 1, -1, 1), resolution=3
        )

        # Figure 2: annotated heatmap, without and with explicit imshow kwargs.
        def _grid_with_annotation(points):
            values = points[:, 0].reshape(3, 3)
            annotation = np.argmax(points, axis=1).reshape(3, 3)
            return values, annotation

        canvas, _ = active_library().new_canvas()
        heatmap_options = dict(extent=(-1, 1, -1, 1), resolution=3)
        active_library().annotation_heatmap_interact(
            canvas, _grid_with_annotation, **heatmap_options
        )
        active_library().annotation_heatmap_interact(
            canvas,
            _grid_with_annotation,
            imshow_kwargs=dict(interpolation="nearest"),
            **heatmap_options
        )

        # Figure 3: gradient fill with a two-colour map.
        canvas, _ = active_library().new_canvas(figsize=(4, 3))
        colour_values = np.array([0.4, 0.5])
        two_tone = matplotlib.colors.LinearSegmentedColormap.from_list(
            "WhToColor", ("r", "b"), N=colour_values.size
        )
        active_library().fill_gradient(
            canvas,
            np.linspace(0, 1, 100),
            [0, 1, 2],
            facecolors=["r", "g"],
            array=colour_values,
            cmap=two_tone,
        )

        # Figure 4: line in a labelled 3d canvas.
        canvas, _ = active_library().new_canvas(
            num="3d_plot",
            figsize=(4, 3),
            projection="3d",
            xlabel="x",
            ylabel="y",
            zlabel="z",
            title="awsome title",
            xlim=(-1, 1),
            ylim=(-1, 1),
            zlim=(-3, 3),
        )
        height = 2 - np.abs(np.linspace(-2, 2, 100)) + 1
        xs = height * np.sin(np.linspace(-2 * np.pi, 2 * np.pi, 100))
        ys = height * np.cos(np.linspace(-np.pi, np.pi, 100))
        active_library().plot(canvas, xs, ys, height, linewidth=2)

        figure_names = ("imshow_interact", "annotation_interact", "gradient", "3d_plot")
        baselines = ["coverage_" + suffix for suffix in figure_names]
        for check in _image_comparison(
            baseline_images=baselines, extensions=extensions
        ):
            yield (check,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_kernel():
    """Plot ARD weights and covariance slices of a composite kernel and compare them.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import warnings

    np.random.seed(1239847)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    with warnings.catch_warnings():
        warnings.simplefilter("ignore")

        # Randomised source kernel whose parameters are copied into ``kernel``.
        donor = GPy.kern.RBF(5, ARD=True) * GPy.kern.Linear(
            3, active_dims=[0, 2, 4], ARD=True
        ) + GPy.kern.Bias(2)
        donor.randomize()

        kernel = (
            GPy.kern.RBF(5, ARD=True)
            * GPy.kern.Linear(3, active_dims=[0, 2, 4], ARD=True)
            + GPy.kern.Bias(2)
            + GPy.kern.White(4)
        )
        # All parameters except the last one are taken from the donor.
        kernel[:-1] = donor[:]

        kernel.plot_ARD(["rbf", "linear", "bias"], legend=True)
        covariance_plots = (
            dict(visible_dims=[0, 3], plot_limits=(-1, 3)),
            dict(visible_dims=[2], plot_limits=(-1, 3)),
            dict(
                visible_dims=[2, 4],
                plot_limits=((-1, 0), (5, 3)),
                projection="3d",
                rstride=10,
                cstride=10,
            ),
            dict(visible_dims=[1, 4]),
        )
        for options in covariance_plots:
            kernel.plot_covariance(**options)

        baselines = [
            "kern_" + suffix
            for suffix in ("ARD", "cov_2d", "cov_1d", "cov_3d", "cov_no_lim")
        ]
        for check in _image_comparison(
            baseline_images=baselines, extensions=extensions
        ):
            yield (check,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_plot():
    """Run the 1d plotting methods of a SparseGPRegression model and compare them.

    The model is built with ``X_variance`` set and is plotted without calling
    ``optimize``.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import warnings
    import matplotlib

    np.random.seed(111)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    with warnings.catch_warnings():
        warnings.simplefilter("ignore")
        inputs = np.random.uniform(-2, 2, (40, 1))
        latent = 0.2 * np.sin(1.3 * inputs) + 1.3 * np.cos(2 * inputs)
        targets = latent + np.random.normal(0, 0.1, latent.shape)
        model = GPy.models.SparseGPRegression(
            inputs, targets, X_variance=np.ones_like(inputs) * [0.06]
        )
        # One figure per call, in the order of the baseline names below.
        for method_name in (
            "plot_data",
            "plot_mean",
            "plot_confidence",
            "plot_density",
            "plot_errorbars_trainset",
            "plot_samples",
            "plot_data_error",
        ):
            getattr(model, method_name)()

    suffixes = ("data", "mean", "conf", "density", "out_error", "samples", "in_error")
    baselines = ["gp_" + suffix for suffix in suffixes]
    for check in _image_comparison(baseline_images=baselines, extensions=extensions):
        yield (check,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_twod():
    """Run the plotting methods of a SparseGPRegression model with 2d inputs.

    The model is plotted without calling ``optimize``.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import matplotlib

    np.random.seed(11111)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    inputs = np.random.uniform(-2, 2, (40, 2))
    first, second = inputs[:, [0]], inputs[:, [1]]
    latent = 0.2 * np.sin(1.3 * first) + 1.3 * np.cos(2 * second)
    targets = latent + np.random.normal(0, 0.1, latent.shape)
    model = GPy.models.SparseGPRegression(
        inputs, targets, X_variance=np.ones_like(inputs) * [0.01, 0.2]
    )

    # One figure per call, in the order of the baseline names below.
    model.plot_data()
    model.plot_mean()
    model.plot_inducing(legend=False, marker="s")
    model.plot_data_error()

    baselines = [
        "gp_2d_" + suffix for suffix in ("data", "mean", "inducing", "in_error")
    ]
    for check in _image_comparison(baseline_images=baselines, extensions=extensions):
        yield (check,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_threed():
    """Run the 3d-projection plotting methods of a SparseGPRegression model.

    The sample plots are drawn first and closed again; only the data, mean and
    inducing-input figures are compared.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import matplotlib

    np.random.seed(11111)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    inputs = np.random.uniform(-2, 2, (40, 2))
    first, second = inputs[:, [0]], inputs[:, [1]]
    latent = 0.2 * np.sin(1.3 * first) + 1.3 * np.cos(2 * second)
    targets = latent + np.random.normal(0, 0.1, latent.shape)
    model = GPy.models.SparseGPRegression(inputs, targets)
    model.likelihood.variance = 0.1

    # Exercised only for coverage; these figures are discarded right away.
    model.plot_samples(projection="3d", samples=1)
    model.plot_samples(projection="3d", plot_raw=False, samples=1)
    plt.close("all")

    # One figure per call, in the order of the baseline names below.
    model.plot_data(projection="3d")
    model.plot_mean(projection="3d", rstride=10, cstride=10)
    model.plot_inducing(projection="3d")

    baselines = ["gp_3d_" + suffix for suffix in ("data", "mean", "inducing")]
    for check in _image_comparison(baseline_images=baselines, extensions=extensions):
        yield (check,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_sparse():
    """Plot data and data error of a SparseGPRegression model into one axes.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import matplotlib

    np.random.seed(11111)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    inputs = np.random.uniform(-2, 2, (40, 1))
    latent = 0.2 * np.sin(1.3 * inputs) + 1.3 * np.cos(2 * inputs)
    targets = latent + np.random.normal(0, 0.1, latent.shape)
    model = GPy.models.SparseGPRegression(
        inputs, targets, X_variance=np.ones_like(inputs) * 0.1
    )

    # Both plots share a single axes, so only one figure is compared.
    _, shared_axes = plt.subplots()
    model.plot_data(ax=shared_axes)
    model.plot_data_error(ax=shared_axes)

    baselines = ["sparse_gp_" + suffix for suffix in ("data_error",)]
    for check in _image_comparison(baseline_images=baselines, extensions=extensions):
        yield (check,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_classification():
    """Plot a GPClassification model for three plot_raw/apply_link combinations.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import matplotlib

    np.random.seed(11111)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    inputs = np.random.uniform(-2, 2, (40, 1))
    latent = 0.2 * np.sin(1.3 * inputs) + 1.3 * np.cos(2 * inputs)
    targets = latent + np.random.normal(0, 0.1, latent.shape)
    # Labels are obtained by thresholding the targets at their mean.
    model = GPy.models.GPClassification(inputs, targets > targets.mean())

    # (plot_raw, apply_link) per figure, in the order of the baseline names.
    for raw, link in ((False, False), (True, False), (True, True)):
        _, axes = plt.subplots()
        model.plot(plot_raw=raw, apply_link=link, ax=axes, samples=3)
        model.plot_errorbars_trainset(plot_raw=raw, apply_link=link, ax=axes)

    baselines = ["gp_class_" + suffix for suffix in ("likelihood", "raw", "raw_link")]
    for check in _image_comparison(baseline_images=baselines, extensions=extensions):
        yield (check,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_sparse_classification():
    """Plot a SparseGPClassification model for three plot_raw/apply_link combinations.

    The comparison uses ``rtol=2``.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import matplotlib

    np.random.seed(11111)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    inputs = np.random.uniform(-2, 2, (40, 1))
    latent = 0.2 * np.sin(1.3 * inputs) + 1.3 * np.cos(2 * inputs)
    targets = latent + np.random.normal(0, 0.1, latent.shape)
    # Labels are obtained by thresholding the targets at their mean.
    model = GPy.models.SparseGPClassification(inputs, targets > targets.mean())

    model.plot(plot_raw=False, apply_link=False, samples_likelihood=3)
    # The two raw plots are each drawn right after re-seeding the generator.
    for link in (False, True):
        np.random.seed(111)
        model.plot(plot_raw=True, apply_link=link, samples=3)

    baselines = [
        "sparse_gp_class_" + suffix for suffix in ("likelihood", "raw", "raw_link")
    ]
    for check in _image_comparison(
        baseline_images=baselines, extensions=extensions, rtol=2
    ):
        yield (check,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_gplvm():
    """Plot a GPLVM restored from the stored fixture and compare the figures.

    Data, labels and model parameters are read from ``b-gplvm-save.npz`` in
    ``basedir``; the model is not optimised.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import warnings
    from GPy.models import GPLVM

    np.random.seed(12345)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    # Recipe kept for reference; presumably how the stored fixture was created:
    # Q = 3
    # N = 60
    # k1 = GPy.kern.RBF(5, variance=1, lengthscale=1./np.random.dirichlet(np.r_[10,10,10,0.1,0.1]), ARD=True)
    # k2 = GPy.kern.RBF(5, variance=1, lengthscale=1./np.random.dirichlet(np.r_[10,0.1,10,0.1,10]), ARD=True)
    # k3 = GPy.kern.RBF(5, variance=1, lengthscale=1./np.random.dirichlet(np.r_[0.1,0.1,10,10,10]), ARD=True)
    # X = np.random.normal(0, 1, (N, 5))
    # A = np.random.multivariate_normal(np.zeros(N), k1.K(X), Q).T
    # B = np.random.multivariate_normal(np.zeros(N), k2.K(X), Q).T
    # C = np.random.multivariate_normal(np.zeros(N), k3.K(X), Q).T
    # Y = np.vstack((A,B,C))
    # labels = np.hstack((np.zeros(A.shape[0]), np.ones(B.shape[0]), np.ones(C.shape[0])*2))

    # Read everything that is needed up front so the archive is closed again
    # instead of staying open for the rest of the test.
    with np.load(os.path.join(basedir, "b-gplvm-save.npz")) as pars:
        Y = pars["Y"]
        Q = pars["Q"]
        labels = pars["labels"]
        stored_params = pars["gplvm_p"]

    # record=True collects the warnings instead of printing them.
    with warnings.catch_warnings(record=True):
        warnings.simplefilter("always")
        m = GPLVM(Y, Q, initialize=False)
        # Updates are switched off while the stored parameters are written in.
        m.update_model(False)
        m.initialize_parameter()
        m[:] = stored_params
        m.update_model(True)

        np.random.seed(111)
        m.plot_latent(labels=labels)
        np.random.seed(111)
        m.plot_scatter(projection="3d", labels=labels)
        np.random.seed(111)
        m.plot_magnification(labels=labels)
        m.plot_steepest_gradient_map(resolution=10, data_labels=labels)

        for do_test in _image_comparison(
            baseline_images=[
                "gplvm_{}".format(sub)
                for sub in ["latent", "latent_3d", "magnification", "gradient"]
            ],
            extensions=extensions,
            tol=12,
        ):
            yield (do_test,)
@pytest.mark.skipif(
    matplotlib is None or baseline_dir is None, reason="Matplotlib not installed"
)
def test_bayesian_gplvm():
    """Plot a BayesianGPLVM restored from the stored fixture and compare the figures.

    Data, labels and model parameters are read from ``b-gplvm-save.npz`` in
    ``basedir``; the model is not optimised.

    NOTE(review): this is a generator-style test; pytest >= 4 does not run
    yield tests -- confirm how the yielded checks are executed.
    """
    import warnings

    # Absolute import, matching the other imports in this module; it does not
    # depend on this file being imported as part of the GPy package.
    from GPy.models import BayesianGPLVM

    np.random.seed(12345)
    matplotlib.rcParams.update(matplotlib.rcParamsDefault)
    matplotlib.rcParams["text.usetex"] = False

    # Recipe kept for reference; presumably how the stored fixture was created:
    # Q = 3
    # N = 10
    # k1 = GPy.kern.RBF(5, variance=1, lengthscale=1./np.random.dirichlet(np.r_[10,10,10,0.1,0.1]), ARD=True)
    # k2 = GPy.kern.RBF(5, variance=1, lengthscale=1./np.random.dirichlet(np.r_[10,0.1,10,0.1,10]), ARD=True)
    # k3 = GPy.kern.RBF(5, variance=1, lengthscale=1./np.random.dirichlet(np.r_[0.1,0.1,10,10,10]), ARD=True)
    # X = np.random.normal(0, 1, (N, 5))
    # A = np.random.multivariate_normal(np.zeros(N), k1.K(X), Q).T
    # B = np.random.multivariate_normal(np.zeros(N), k2.K(X), Q).T
    # C = np.random.multivariate_normal(np.zeros(N), k3.K(X), Q).T
    # Y = np.vstack((A,B,C))
    # labels = np.hstack((np.zeros(A.shape[0]), np.ones(B.shape[0]), np.ones(C.shape[0])*2))

    # Read everything that is needed up front so the archive is closed again
    # instead of staying open for the rest of the test.
    with np.load(os.path.join(basedir, "b-gplvm-save.npz")) as pars:
        Y = pars["Y"]
        Q = pars["Q"]
        labels = pars["labels"]
        stored_params = pars["bgplvm_p"]

    # record=True collects the warnings instead of printing them.
    with warnings.catch_warnings(record=True):
        warnings.simplefilter("always")
        m = BayesianGPLVM(Y, Q, initialize=False)
        # Updates are switched off while the stored parameters are written in.
        m.update_model(False)
        m.initialize_parameter()
        m[:] = stored_params
        m.update_model(True)

        # Every plot is drawn right after re-seeding the random generator.
        np.random.seed(111)
        m.plot_inducing(projection="2d")
        np.random.seed(111)
        m.plot_inducing(projection="3d")
        np.random.seed(111)
        m.plot_latent(projection="2d", labels=labels)
        np.random.seed(111)
        m.plot_scatter(projection="3d", labels=labels)
        np.random.seed(111)
        m.plot_magnification(labels=labels)
        np.random.seed(111)
        m.plot_steepest_gradient_map(resolution=10, data_labels=labels)

        for do_test in _image_comparison(
            baseline_images=[
                "bayesian_gplvm_{}".format(sub)
                for sub in [
                    "inducing",
                    "inducing_3d",
                    "latent",
                    "latent_3d",
                    "magnification",
                    "gradient",
                ]
            ],
            extensions=extensions,
        ):
            yield (do_test,)