From 8c5085120405be6df428c8b407d49cfb6e9d12cd Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Tue, 21 May 2024 10:11:45 -0600
Subject: [PATCH 01/15] change environment.yml to allow only for python 3.8 and
 above

---
 environment.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/environment.yml b/environment.yml
index 0af065ea..d3156171 100644
--- a/environment.yml
+++ b/environment.yml
@@ -3,8 +3,8 @@ channels:
   - defaults
   - conda-forge
 dependencies:
-  - python>3.6
-  - numpy>=1.26
+  - python>=3.8
+  - numpy>=1.20
   - matplotlib
   - scipy
   - jupyter

From fbb07737ed52dd8b333321cdb521baa3f7b86e49 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Tue, 21 May 2024 10:19:09 -0600
Subject: [PATCH 02/15] update ci file to create docs to use setup-miniconda@v3

---
 .github/workflows/continuous-integration-workflow-docs.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/continuous-integration-workflow-docs.yml b/.github/workflows/continuous-integration-workflow-docs.yml
index 464629cb..d0dfec09 100644
--- a/.github/workflows/continuous-integration-workflow-docs.yml
+++ b/.github/workflows/continuous-integration-workflow-docs.yml
@@ -29,9 +29,9 @@ jobs:
         # Expected 96 from C header, got 88 from PyObject
 
     steps:
-      - uses: actions/checkout@v2
+      - uses: actions/checkout@v4
       - name: Setup Miniconda with Python ${{ matrix.python-version }} on ${{ matrix.os }}
-        uses: conda-incubator/setup-miniconda@v2
+        uses: conda-incubator/setup-miniconda@v3
         with:
           activate-environment: pyapprox-base
           python-version: ${{ matrix.python-version }}

From fafad31388f65f656ba8a8ca114d1d5198242657 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Tue, 21 May 2024 10:40:17 -0600
Subject: [PATCH 03/15] Fix error with torchklewrapper

---
 .../continuous-integration-workflow-conda.yml          |  4 ++--
 pyapprox/expdesign/optbayes.py                         |  3 ++-
 pyapprox/pde/karhunen_loeve_expansion.py               |  7 ++++++-
 tutorials/expdesign/plot_bayesian_oed.py               | 10 +---------
 4 files changed, 11 insertions(+), 13 deletions(-)

diff --git a/.github/workflows/continuous-integration-workflow-conda.yml b/.github/workflows/continuous-integration-workflow-conda.yml
index 45cc55f8..0b135695 100644
--- a/.github/workflows/continuous-integration-workflow-conda.yml
+++ b/.github/workflows/continuous-integration-workflow-conda.yml
@@ -32,9 +32,9 @@ jobs:
         # Expected 96 from C header, got 88 from PyObject
 
     steps:
-      - uses: actions/checkout@v2
+      - uses: actions/checkout@v4
       - name: Setup Miniconda with Python ${{ matrix.python-version }} on ${{ matrix.os }}
-        uses: conda-incubator/setup-miniconda@v2
+        uses: conda-incubator/setup-miniconda@v3
         with:
           activate-environment: pyapprox-base
           python-version: ${{ matrix.python-version }}
diff --git a/pyapprox/expdesign/optbayes.py b/pyapprox/expdesign/optbayes.py
index 5512eb7e..2bff8ef2 100644
--- a/pyapprox/expdesign/optbayes.py
+++ b/pyapprox/expdesign/optbayes.py
@@ -262,7 +262,8 @@ def __init__(self, noise_cov_diag, outer_pred_obs,
 
     def __call__(self, design_weights):
         evidences = self._log_evidence._evidence(design_weights)
-        deviations = 
+        deviations = None
+
 
 class WeightsConstraintModel(Model):
     def __init__(self):
diff --git a/pyapprox/pde/karhunen_loeve_expansion.py b/pyapprox/pde/karhunen_loeve_expansion.py
index 7bb44836..2744dafe 100644
--- a/pyapprox/pde/karhunen_loeve_expansion.py
+++ b/pyapprox/pde/karhunen_loeve_expansion.py
@@ -15,7 +15,7 @@ def exponential_kle_eigenvalues(sigma2, corr_len, omega):
 def exponential_kle_basis(x, corr_len, sigma2, dom_len, omega):
     r"""
     Basis for the kernel K(x,y)=\sigma^2\exp(-|x-y|/l)
-
+ab
     Parameters
     ----------
     x : np.ndarray (num_spatial_locations)
@@ -426,6 +426,11 @@ def __call__(self, coef):
     def __repr__(self):
         return "TorchWrapper({0})".format(self._kle.__repr__())
 
+    def _compute_kernel_matrix(self):
+        import torch
+        return torch.as_tensor(
+            self.kle._compute_kernel_matrix(), dtype=torch.double)
+
 
 class DataDrivenKLE(AbstractKLE):
     def __init__(self, field_samples, mean_field=0,
diff --git a/tutorials/expdesign/plot_bayesian_oed.py b/tutorials/expdesign/plot_bayesian_oed.py
index 45ddfaeb..bd5f388c 100644
--- a/tutorials/expdesign/plot_bayesian_oed.py
+++ b/tutorials/expdesign/plot_bayesian_oed.py
@@ -4,7 +4,6 @@
 """
 #%%
 #Load modules
-import os
 from functools import partial
 from multiprocessing import Pool
 
@@ -41,13 +40,6 @@ def vertical_subplots(nx):
 horizontal = True
 subplots = horizontal_subplots
 
-#%%
-#Configure latex for plotting
-import matplotlib as mpl
-mpl.rcParams['text.usetex'] = True  # use latex for all text handling
-mpl.rcParams['text.latex.preamble'] = (
-    r'\usepackage{siunitx}\usepackage{amsmath}\usepackage{amssymb}')
-
 #%%
 #Setup prior and noise variables
 
@@ -165,7 +157,7 @@ def plot_data_surface_ribbons(design_pts, design_symbs, ax):
 
 design_pts = [np.array([[-1]]), np.array([[0.5]]), np.array([[1]])]
 # design_pts = [np.array([[0.25]]), np.array([[0.5]]), np.array([[1]])]
-design_symbs = [r"\xi", r"\xi^\prime", r"\xi^\dagger"]
+design_symbs = [r"\xi_1", r"\xi_2", r"\xi_3"]
 
 if prior_variable.num_vars() == 1:
     ax_ribbon = create_3d_axis()

From d896cbd44b7477d13b3e1bb4fae020f47d7f1dda Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Wed, 22 May 2024 17:33:34 -0600
Subject: [PATCH 04/15] Change autogp kernels to accept linear algebra Mixin
 classes that allows them to be easily used for different packages such as
 numpy and torch. The kernels were then elevated to the surrogate module as
 they will be re-used in other kernel based methods besides GP

---
 pyapprox/surrogates/autogp/exactgp.py         | 131 ++++----
 pyapprox/surrogates/autogp/hyperparameter.py  | 155 ----------
 pyapprox/surrogates/autogp/kernels.py         | 253 ---------------
 pyapprox/surrogates/autogp/mokernels.py       | 235 +++-----------
 pyapprox/surrogates/autogp/numpytrends.py     |  14 +
 .../autogp/tests/test_gaussian_process.py     | 265 +++++++++-------
 .../surrogates/autogp/tests/test_kernels.py   |  87 ------
 .../surrogates/autogp/tests/test_mokernels.py | 141 +++++----
 pyapprox/surrogates/autogp/torchgp.py         | 136 +++++++++
 pyapprox/surrogates/autogp/torchtrends.py     |  14 +
 pyapprox/surrogates/autogp/trends.py          |  56 ++++
 pyapprox/surrogates/autogp/variationalgp.py   |  96 +++---
 pyapprox/surrogates/kernels/__init__.py       |   0
 pyapprox/surrogates/kernels/_kernels.py       | 289 ++++++++++++++++++
 pyapprox/surrogates/kernels/numpykernels.py   |  75 +++++
 pyapprox/surrogates/kernels/tests/__init__.py |   0
 .../surrogates/kernels/tests/test_kernels.py  | 120 ++++++++
 pyapprox/surrogates/kernels/torchkernels.py   |  91 ++++++
 pyapprox/util/hyperparameter/__init__.py      |   0
 .../util/hyperparameter/_hyperparameter.py    | 241 +++++++++++++++
 .../hyperparameter/numpyhyperparameter.py     |  22 ++
 .../hyperparameter/torchhyperparameter.py     |  22 ++
 pyapprox/util/linearalgebra/__init__.py       |   0
 pyapprox/util/linearalgebra/linalgbase.py     | 258 ++++++++++++++++
 pyapprox/util/linearalgebra/numpylinalg.py    | 140 +++++++++
 pyapprox/util/linearalgebra/torchlinalg.py    | 153 ++++++++++
 .../tests/test_hyperparameter.py              |  28 +-
 .../autogp => util}/tests/test_transforms.py  |  45 +--
 pyapprox/util/transforms/__init__.py          |   0
 .../transforms/_transforms.py}                | 115 ++++---
 pyapprox/util/transforms/numpytransforms.py   |  24 ++
 pyapprox/util/transforms/torchtransforms.py   |  24 ++
 setup.py                                      |   1 +
 33 files changed, 2185 insertions(+), 1046 deletions(-)
 delete mode 100644 pyapprox/surrogates/autogp/hyperparameter.py
 delete mode 100644 pyapprox/surrogates/autogp/kernels.py
 create mode 100644 pyapprox/surrogates/autogp/numpytrends.py
 delete mode 100644 pyapprox/surrogates/autogp/tests/test_kernels.py
 create mode 100644 pyapprox/surrogates/autogp/torchgp.py
 create mode 100644 pyapprox/surrogates/autogp/torchtrends.py
 create mode 100644 pyapprox/surrogates/autogp/trends.py
 create mode 100644 pyapprox/surrogates/kernels/__init__.py
 create mode 100644 pyapprox/surrogates/kernels/_kernels.py
 create mode 100644 pyapprox/surrogates/kernels/numpykernels.py
 create mode 100644 pyapprox/surrogates/kernels/tests/__init__.py
 create mode 100644 pyapprox/surrogates/kernels/tests/test_kernels.py
 create mode 100644 pyapprox/surrogates/kernels/torchkernels.py
 create mode 100644 pyapprox/util/hyperparameter/__init__.py
 create mode 100644 pyapprox/util/hyperparameter/_hyperparameter.py
 create mode 100644 pyapprox/util/hyperparameter/numpyhyperparameter.py
 create mode 100644 pyapprox/util/hyperparameter/torchhyperparameter.py
 create mode 100644 pyapprox/util/linearalgebra/__init__.py
 create mode 100644 pyapprox/util/linearalgebra/linalgbase.py
 create mode 100644 pyapprox/util/linearalgebra/numpylinalg.py
 create mode 100644 pyapprox/util/linearalgebra/torchlinalg.py
 rename pyapprox/{surrogates/autogp => util}/tests/test_hyperparameter.py (59%)
 rename pyapprox/{surrogates/autogp => util}/tests/test_transforms.py (57%)
 create mode 100644 pyapprox/util/transforms/__init__.py
 rename pyapprox/{surrogates/autogp/transforms.py => util/transforms/_transforms.py} (55%)
 create mode 100644 pyapprox/util/transforms/numpytransforms.py
 create mode 100644 pyapprox/util/transforms/torchtransforms.py

diff --git a/pyapprox/surrogates/autogp/exactgp.py b/pyapprox/surrogates/autogp/exactgp.py
index 8d9c75e1..47f866a1 100644
--- a/pyapprox/surrogates/autogp/exactgp.py
+++ b/pyapprox/surrogates/autogp/exactgp.py
@@ -1,40 +1,27 @@
+from abc import ABC, abstractmethod
 from typing import Tuple
+import warnings
+
 import numpy as np
 import torch
 import scipy
-import warnings
 
-from pyapprox.variables.transforms import IdentityTransformation
-from pyapprox.surrogates.autogp._torch_wrappers import (
-    diag, full, cholesky, cholesky_solve, log, solve_triangular, einsum,
-    multidot, array, asarray, sqrt, eye, vstack)
-from pyapprox.surrogates.autogp.kernels import Kernel, Monomial
-from pyapprox.surrogates.autogp.transforms import (
-    StandardDeviationValuesTransform)
 from pyapprox.surrogates.autogp.mokernels import MultiPeerKernel
 
 
-class ExactGaussianProcess():
+class ExactGaussianProcess(ABC):
     def __init__(self,
-                 nvars: int,
-                 kernel: Kernel,
-                 kernel_reg: float = 0,
-                 var_trans=None,
-                 values_trans=None,
-                 mean: Monomial = None):
+                 nvars,
+                 kernel,
+                 var_trans,
+                 values_trans,
+                 mean,
+                 kernel_reg):
         self.kernel = kernel
         self.mean = mean
         self.kernel_reg = kernel_reg
-        if var_trans is None:
-            self.var_trans = IdentityTransformation(nvars)
-        else:
-            self.var_trans = var_trans
-        if self.var_trans.num_vars() != nvars:
-            raise ValueError("var_trans and nvars are inconsistent")
-        if values_trans is None:
-            self.values_trans = StandardDeviationValuesTransform()
-        else:
-            self.values_trans = values_trans
+        self.var_trans = var_trans
+        self.values_trans = values_trans
 
         self._coef = None
         self._coef_args = None
@@ -55,14 +42,14 @@ def _training_kernel_matrix(self) -> Tuple:
         # kmat[np.diag_indices_from(kmat)] += self.kernel_reg
         # This also does not work
         # kmat += diag(full((kmat.shape[0], 1), float(self.kernel_reg)))
-        kmat = kmat + eye(kmat.shape[0])*float(self.kernel_reg)
+        kmat = kmat + self._la_eye(kmat.shape[0])*float(self.kernel_reg)
         return kmat
 
     def _factor_training_kernel_matrix(self):
         # can be specialized
         kmat = self._training_kernel_matrix()
         try:
-            return (cholesky(kmat), )
+            return (self._la_cholesky(kmat), )
         except:
             return None, kmat
 
@@ -70,28 +57,28 @@ def _solve_coefficients(self, *args) -> Tuple:
         # can be specialized when _factor_training_kernel_matrix is specialized
         diff = (self.canonical_train_values -
                 self._canonical_mean(self.canonical_train_samples))
-        return cholesky_solve(args[0], diff)
+        return self._la_cholesky_solve(args[0], diff)
 
     def _Linv_y(self, *args):
         diff = (self.canonical_train_values -
                 self._canonical_mean(self.canonical_train_samples))
-        return solve_triangular(args[0], diff)
+        return self._la_solve_triangular(args[0], diff)
 
     def _log_determinant(self, coef_res: Tuple) -> float:
         # can be specialized when _factor_training_kernel_matrix is specialized
         chol_factor = coef_res[0]
-        return 2*log(diag(chol_factor)).sum()
+        return 2*self._la_log(self._la_get_diagonal(chol_factor)).sum()
 
     def _canonical_posterior_pointwise_variance(
             self, canonical_samples, kmat_pred):
         # can be specialized when _factor_training_kernel_matrix is specialized
-        tmp = solve_triangular(self._coef_args[0], kmat_pred.T)
-        update = einsum("ji,ji->i", tmp, tmp)
+        tmp = self._la_solve_triangular(self._coef_args[0], kmat_pred.T)
+        update = self._la_einsum("ji,ji->i", tmp, tmp)
         return (self.kernel.diag(canonical_samples) - update)[:, None]
 
     def _canonical_mean(self, canonical_samples):
         if self.mean is None:
-            return full((canonical_samples.shape[1], 1), 0.)
+            return self._la_full((canonical_samples.shape[1], 1), 0.)
         return self.mean(canonical_samples)
 
     def _neg_log_likelihood_with_hyperparameter_mean(self) -> float:
@@ -99,11 +86,12 @@ def _neg_log_likelihood_with_hyperparameter_mean(self) -> float:
         # but cannot be used if assuming a prior on the coefficients
         coef_args = self._factor_training_kernel_matrix()
         if coef_args[0] is None:
+            print(coef_args)
             return coef_args[1][0, 0]*0+np.inf
         Linv_y = self._Linv_y(*coef_args)
         nsamples = self.canonical_train_values.shape[0]
         return 0.5 * (
-            multidot((Linv_y.T, Linv_y)) +
+            self._la_multidot((Linv_y.T, Linv_y)) +
             self._log_determinant(coef_args) +
             nsamples*np.log(2*np.pi)
         ).sum(axis=1)
@@ -129,27 +117,9 @@ def _neg_log_likelihood(self, active_opt_params):
         return self._neg_log_likelihood_with_hyperparameter_mean()
         # return self._neg_log_likelihood_with_uncertain_mean()
 
+    @abstractmethod
     def _fit_objective(self, active_opt_params_np):
-        # this is only pplace where torch should be called explicitly
-        # as we are using its functionality to compute the gradient of their
-        # negative log likelihood. We could replace this with a grad
-        # computed analytically
-        active_opt_params = torch.tensor(
-            active_opt_params_np, dtype=torch.double, requires_grad=True)
-        nll = self._neg_log_likelihood(active_opt_params)
-        nll.backward()
-        val = nll.item()
-        # copy is needed because zero_ is called
-        nll_grad = active_opt_params.grad.detach().numpy().copy()
-        active_opt_params.grad.zero_()
-        # must set requires grad to False after gradient is computed
-        # otherwise when evaluate_posterior will fail because it will
-        # still think the hyper_params require grad. Extra copies could be
-        # avoided by doing this after fit is complete. However then fit
-        # needs to know when torch is being used
-        for hyp in self.hyp_list.hyper_params:
-            hyp.detach()
-        return val, nll_grad
+        raise NotImplementedError
 
     def _local_optimize(self, init_active_opt_params_np, bounds):
         method = "L-BFGS-B"
@@ -183,17 +153,17 @@ def _global_optimize(self, max_nglobal_opt_iters=1):
                 best_idx = ii
                 best_obj = results[-1].fun
         self.hyp_list.set_active_opt_params(
-            asarray(results[best_idx].x))
+            self._la_atleast1d(results[best_idx].x))
 
-    def set_training_data(self, train_samples: array, train_values: array):
+    def set_training_data(self, train_samples, train_values):
         self.train_samples = train_samples
         self.train_values = train_values
-        self.canonical_train_samples = asarray(
+        self.canonical_train_samples = (
             self._map_samples_to_canonical(train_samples))
-        self.canonical_train_values = asarray(
+        self.canonical_train_values = (
             self.values_trans.map_to_canonical(train_values))
 
-    def fit(self, train_samples: array, train_values: array, **kwargs):
+    def fit(self, train_samples, train_values, **kwargs):
         self.set_training_data(train_samples, train_values)
         self._global_optimize(**kwargs)
 
@@ -203,7 +173,7 @@ def _evaluate_prior(self, samples, return_std):
         if not return_std:
             return mean
         return mean, self.values_trans.map_stdev_from_canonical(
-            sqrt(self.kernel.diag(samples)))
+            self._la_sqrt(self.kernel.diag(samples)))
 
     def _map_samples_to_canonical(self, samples):
         return self.var_trans.map_to_canonical(samples)
@@ -218,8 +188,8 @@ def _evaluate_posterior(self, samples, return_std):
         canonical_samples = self._map_samples_to_canonical(samples)
         kmat_pred = self.kernel(
             canonical_samples, self.canonical_train_samples)
-        canonical_mean = self._canonical_mean(canonical_samples) + multidot((
-            kmat_pred, self._coef))
+        canonical_mean = (self._canonical_mean(canonical_samples) +
+                          self._la_multidot((kmat_pred, self._coef)))
         mean = self.values_trans.map_from_canonical(canonical_mean)
         if not return_std:
             return mean
@@ -307,10 +277,9 @@ def set_training_data(self, train_samples: list, train_values: list):
         self.train_samples = train_samples
         self.train_values = train_values
         self.canonical_train_samples = [
-            asarray(s) for s in self._map_samples_to_canonical(train_samples)]
-        self.canonical_train_values = vstack(
-            [asarray(self.values_trans.map_to_canonical(v))
-             for v in train_values])
+            s for s in self._map_samples_to_canonical(train_samples)]
+        self.canonical_train_values = self._la_vstack(
+            [self.values_trans.map_to_canonical(v) for v in train_values])
 
     def _map_samples_to_canonical(self, samples):
         return [self.var_trans.map_to_canonical(s) for s in samples]
@@ -318,7 +287,8 @@ def _map_samples_to_canonical(self, samples):
     def _canonical_mean(self, canonical_samples):
         if self.mean is not None:
             raise ValueError("Non-zero mean not supported for mulitoutput")
-        return full((sum([s.shape[1] for s in canonical_samples]), 1), 0.)
+        return self._la_full(
+            (sum([s.shape[1] for s in canonical_samples]), 1), 0.)
 
     def plot_1d(self, ax, bounds, output_id, npts_1d=101, nstdevs=2,
                 plt_kwargs={}, fill_kwargs={'alpha': 0.3}, prior_kwargs=None,
@@ -356,11 +326,11 @@ def _solve_coefficients(self, *args) -> Tuple:
         # can be specialized when _factor_training_kernel_matrix is specialized
         diff = (self.canonical_train_values -
                 self._canonical_mean(self.canonical_train_samples))
-        return MultiPeerKernel._cholesky_solve(*args, diff)
+        return MultiPeerKernel._cholesky_solve(*args, diff, self)
 
     def _log_determinant(self, coef_res: Tuple) -> float:
         # can be specialized when _factor_training_kernel_matrix is specialized
-        return MultiPeerKernel._logdet(*coef_res)
+        return MultiPeerKernel._logdet(*coef_res, self)
 
     def _training_kernel_matrix(self) -> Tuple:
         # must only pass in X and not Y to kernel otherwise if noise kernel
@@ -369,11 +339,13 @@ def _training_kernel_matrix(self) -> Tuple:
         for ii in range(len(blocks)):
             blocks[ii][ii] = (
                 blocks[ii][ii] +
-                eye(blocks[ii][ii].shape[0])*float(self.kernel_reg))
+                self._la_eye(blocks[ii][ii].shape[0])*float(self.kernel_reg))
         return blocks
 
     def _factor_training_kernel_matrix(self):
         blocks = self._training_kernel_matrix()
+        return MultiPeerKernel._cholesky(
+                len(blocks[0]), blocks, block_format=True, la=self)
         try:
             return MultiPeerKernel._cholesky(
                 len(blocks[0]), blocks, block_format=True)
@@ -383,27 +355,27 @@ def _factor_training_kernel_matrix(self):
     def _Linv_y(self, *args):
         diff = (self.canonical_train_values -
                 self._canonical_mean(self.canonical_train_samples))
-        return MultiPeerKernel._lower_solve_triangular(*args, diff)
+        return MultiPeerKernel._lower_solve_triangular(*args, diff, self)
 
     def _canonical_posterior_pointwise_variance(
             self, canonical_samples, kmat_pred):
         # can be specialized when _factor_training_kernel_matrix is specialized
         tmp = MultiPeerKernel._lower_solve_triangular(
-            *self._coef_args, kmat_pred.T)
-        update = einsum("ji,ji->i", tmp, tmp)
+            *self._coef_args, kmat_pred.T, self)
+        update = self._la_einsum("ji,ji->i", tmp, tmp)
         return (self.kernel.diag(canonical_samples) - update)[:, None]
 
 
 class MOICMPeerExactGaussianProcess(MOExactGaussianProcess):
     def __init__(self,
-                 nvars: int,
-                 kernel: Kernel,
+                 nvars,
+                 kernel,
                  output_kernel,
-                 kernel_reg: float = 0,
-                 var_trans=None,
-                 values_trans=None):
+                 var_trans,
+                 values_trans,
+                 kernel_reg):
         super().__init__(
-            nvars, kernel, kernel_reg, var_trans, values_trans, None)
+            nvars, kernel, var_trans, values_trans, None, kernel_reg)
         self.output_kernel = output_kernel
 
     @staticmethod
@@ -443,6 +415,7 @@ def _get_constraints(self, noutputs):
         return icm_cons
 
     def _local_optimize(self, init_active_opt_params_np, bounds):
+        # TODO use new optimization classes
         method = "trust-constr"
         # method = "slsqp"
         if method == "trust-constr":
diff --git a/pyapprox/surrogates/autogp/hyperparameter.py b/pyapprox/surrogates/autogp/hyperparameter.py
deleted file mode 100644
index 6eab7f09..00000000
--- a/pyapprox/surrogates/autogp/hyperparameter.py
+++ /dev/null
@@ -1,155 +0,0 @@
-import numpy as np
-from abc import ABC, abstractmethod
-from pyapprox.surrogates.autogp._torch_wrappers import (
-    log, exp, atleast1d, repeat, arange, isnan, vstack, hstack, copy)
-
-
-class HyperParameterTransform(ABC):
-    @abstractmethod
-    def to_opt_space(self, params):
-        raise NotImplementedError
-
-    @abstractmethod
-    def from_opt_space(self, params):
-        raise NotImplementedError
-
-    def __repr__(self):
-        return "{0}".format(self.__class__.__name__)
-
-
-class IdentityHyperParameterTransform(HyperParameterTransform):
-    def to_opt_space(self, params):
-        return params
-
-    def from_opt_space(self, params):
-        return params
-
-
-class LogHyperParameterTransform(HyperParameterTransform):
-    def to_opt_space(self, params):
-        return log(params)
-
-    def from_opt_space(self, params):
-        return exp(params)
-
-
-class HyperParameter():
-    def __init__(self, name: str, nvars: int, values: np.ndarray,
-                 bounds: np.ndarray, transform: HyperParameterTransform):
-        self.name = name
-        self._nvars = nvars
-        self._values = atleast1d(values)
-        if self._values.shape[0] == 1:
-            self._values = repeat(self._values, self.nvars())
-        if self._values.ndim == 2:
-            raise ValueError("values is not a 1D array")
-        if self._values.shape[0] != self.nvars():
-            raise ValueError("values shape {0} inconsistent with nvars".format(
-                self._values.shape))
-        self.bounds = atleast1d(bounds)
-        if self.bounds.shape[0] == 2:
-            self.bounds = repeat(self.bounds, self.nvars())
-        if self.bounds.shape[0] != 2*self.nvars():
-            msg = "bounds shape {0} inconsistent with 2*nvars={1}".format(
-                self.bounds.shape, 2*self.nvars())
-            raise ValueError(msg)
-        self.bounds = self.bounds.reshape((self.bounds.shape[0]//2, 2))
-        self.transform = transform
-        if np.where(
-                (self._values < self.bounds[:, 0]) |
-                (self._values > self.bounds[:, 1]))[0].shape[0] > 0:
-            raise ValueError("values outside bounds")
-        self._active_indices = np.atleast_1d(
-            arange(self.nvars())[~isnan(self.bounds[:, 0])])
-
-    def nvars(self):
-        return self._nvars
-
-    def nactive_vars(self):
-        return self._active_indices.shape[0]
-
-    def set_active_opt_params(self, active_params):
-        # The copy ensures that the error
-        # "a leaf Variable that requires grad is being used in an in-place operation.
-        # is not thrown
-        self._values = copy(self._values)
-        self._values[self._active_indices] = self.transform.from_opt_space(
-            active_params)
-
-    def get_active_opt_params(self):
-        return self.transform.to_opt_space(self._values[self._active_indices])
-
-    def get_active_opt_bounds(self):
-        return self.transform.to_opt_space(
-            self.bounds[self._active_indices, :])
-
-    def get_values(self):
-        return self._values
-
-    def set_values(self, values):
-        self._values = values
-
-    def _short_repr(self):
-        if self.nvars() > 5:
-            return "{0}:nvars={1}".format(self.name, self.nvars())
-
-        return "{0}={1}".format(
-            self.name,
-            "["+", ".join(map("{0:.2g}".format, self._values))+"]")
-
-    def __repr__(self):
-        if self.nvars() > 5:
-            return "{0}(name={1}, nvars={2}, transform={3}, nactive={4})".format(
-                self.__class__.__name__, self.name, self.nvars(),
-                self.transform, self.nactive_vars())
-        return "{0}(name={1}, values={2}, transform={3}, active={4})".format(
-            self.__class__.__name__, self.name,
-            "["+", ".join(map("{0:.2g}".format, self.get_values()))+"]",
-            self.transform,
-            "["+", ".join(map("{0}".format, self._active_indices))+"]")
-
-    def detach(self):
-        self.set_values(self.get_values().detach())
-
-
-class HyperParameterList():
-    def __init__(self, hyper_params: list):
-        self.hyper_params = hyper_params
-
-    def set_active_opt_params(self, active_params):
-        cnt = 0
-        for hyp in self.hyper_params:
-            hyp.set_active_opt_params(
-                active_params[cnt:cnt+hyp.nactive_vars()])
-            cnt += hyp.nactive_vars()
-
-    def get_active_opt_params(self):
-        return hstack(
-            [hyp.get_active_opt_params() for hyp in self.hyper_params])
-
-    def get_active_opt_bounds(self):
-        return vstack(
-            [hyp.get_active_opt_bounds() for hyp in self.hyper_params])
-
-    def get_values(self):
-        return hstack([hyp.get_values() for hyp in self.hyper_params])
-
-    def __add__(self, hyp_list):
-        return HyperParameterList(self.hyper_params+hyp_list.hyper_params)
-
-    def __radd__(self, hyp_list):
-        if hyp_list == 0:
-            # for when sum is called over list of HyperParameterLists
-            return self
-        return HyperParameterList(hyp_list.hyper_params+self.hyper_params)
-
-    def _short_repr(self):
-        # simpler representation used when printing kernels
-        return (
-            ", ".join(
-                map("{0}".format,
-                    [hyp._short_repr() for hyp in self.hyper_params])))
-
-    def __repr__(self):
-        return ("{0}(".format(self.__class__.__name__) +
-                ",\n\t\t   ".join(map("{0}".format, self.hyper_params))+")")
diff --git a/pyapprox/surrogates/autogp/kernels.py b/pyapprox/surrogates/autogp/kernels.py
deleted file mode 100644
index e7675594..00000000
--- a/pyapprox/surrogates/autogp/kernels.py
+++ /dev/null
@@ -1,253 +0,0 @@
-import numpy as np
-from typing import Union
-from abc import ABC, abstractmethod
-
-from pyapprox.surrogates.autogp._torch_wrappers import (
-    full, asarray, sqrt, exp, inf, cdist, array, to_numpy, cholesky, empty,
-    arange, sin, eye)
-from pyapprox.surrogates.autogp.hyperparameter import (
-    HyperParameter, HyperParameterList, IdentityHyperParameterTransform,
-    LogHyperParameterTransform)
-from pyapprox.surrogates.interp.indexing import compute_hyperbolic_indices
-
-
-class Kernel(ABC):
-    @abstractmethod
-    def diag(self, X):
-        raise NotImplementedError
-
-    @abstractmethod
-    def __call__(self, X, Y=None):
-        raise NotImplementedError()
-
-    def __mul__(self, kernel):
-        return ProductKernel(self, kernel)
-
-    def __add__(self, kernel):
-        return SumKernel(self, kernel)
-
-    def __repr__(self):
-        return "{0}({1})".format(
-            self.__class__.__name__, self.hyp_list._short_repr())
-
-    def _cholesky(self, kmat):
-        return cholesky(kmat)
-
-
-class MaternKernel(Kernel):
-    def __init__(self, nu: float,
-                 lenscale: Union[float, array],
-                 lenscale_bounds: array,
-                 nvars: int):
-        self._nvars = nvars
-        self.nu = nu
-        self._lenscale = HyperParameter(
-            "lenscale", nvars, lenscale, lenscale_bounds,
-            LogHyperParameterTransform())
-        self.hyp_list = HyperParameterList([self._lenscale])
-
-    def diag(self, X):
-        return full((X.shape[1],), 1)
-
-    def _eval_distance_form(self, distances):
-        if self.nu == 0.5:
-            return exp(-distances)
-        if self.nu == 1.5:
-            tmp = distances * np.sqrt(3)
-            return (1.0 + tmp) * exp(-tmp)
-        if self.nu == 2.5:
-            tmp = distances * np.sqrt(5)
-            return (1.0 + tmp + tmp**2/3.0) * exp(-tmp)
-        if self.nu == inf:
-            return exp(-(distances**2)/2.0)
-        raise ValueError("Matern kernel with nu={0} not supported".format(
-            self.nu))
-
-    def __call__(self, X, Y=None):
-        lenscale = self._lenscale.get_values()
-        X = asarray(X)
-        if Y is None:
-            Y = X
-        else:
-            Y = asarray(Y)
-        distances = cdist(X.T/lenscale, Y.T/lenscale)
-        return self._eval_distance_form(distances)
-
-    def nvars(self):
-        return self._nvars
-
-
-class ConstantKernel(Kernel):
-    def __init__(self, constant, constant_bounds=[-inf, inf],
-                 transform=IdentityHyperParameterTransform()):
-        self._const = HyperParameter(
-            "const", 1, constant, constant_bounds, transform)
-        self.hyp_list = HyperParameterList([self._const])
-
-    def diag(self, X):
-        return full((X.shape[1],), self.hyp_list.get_values()[0])
-
-    def __call__(self, X, Y=None):
-        X = asarray(X)
-        if Y is None:
-            Y = X
-        else:
-            Y = asarray(Y)
-        # full does not work when const value requires grad
-        # return full((X.shape[1], Y.shape[1]), self._const.get_values()[0])
-        const = empty((X.shape[1], Y.shape[1]))
-        const[:] = self._const.get_values()[0]
-        return const
-
-
-class GaussianNoiseKernel(Kernel):
-    def __init__(self, constant, constant_bounds=[-inf, inf],
-                 transform=IdentityHyperParameterTransform()):
-        self._const = HyperParameter(
-            "const", 1, constant, constant_bounds, transform)
-        self.hyp_list = HyperParameterList([self._const])
-
-    def diag(self, X):
-        return full((X.shape[1],), self.hyp_list.get_values()[0])
-
-    def __call__(self, X, Y=None):
-        X = asarray(X)
-        if Y is None:
-            return self._const.get_values()[0]*eye(X.shape[1])
-        # full does not work when const value requires grad
-        # return full((X.shape[1], Y.shape[1]), self._const.get_values()[0])
-        const = full((X.shape[1], Y.shape[1]), 0.)
-        return const
-
-
-class ProductKernel(Kernel):
-    def __init__(self, kernel1, kernel2):
-        self.kernel1 = kernel1
-        self.kernel2 = kernel2
-        self.hyp_list = kernel1.hyp_list+kernel2.hyp_list
-
-    def diag(self, X):
-        return self.kernel1.diag(X) * self.kernel2.diag(X)
-
-    def __repr__(self):
-        return "{0} * {1}".format(self.kernel1, self.kernel2)
-
-    def __call__(self, X, Y=None):
-        return self.kernel1(X, Y) * self.kernel2(X, Y)
-
-
-class SumKernel(Kernel):
-    def __init__(self, kernel1, kernel2):
-        self.kernel1 = kernel1
-        self.kernel2 = kernel2
-        self.hyp_list = kernel1.hyp_list+kernel2.hyp_list
-
-    def diag(self, X):
-        return self.kernel1.diag(X) + self.kernel2.diag(X)
-
-    def __repr__(self):
-        return "{0} + {1}".format(self.kernel1, self.kernel2)
-
-    def __call__(self, X, Y=None):
-        return self.kernel1(X, Y) + self.kernel2(X, Y)
-
-
-def univariate_monomial_basis_matrix(max_level, samples):
-    assert samples.ndim == 1
-    basis_matrix = samples[:, None]**arange(max_level+1)[None, :]
-    return basis_matrix
-
-
-def monomial_basis_matrix(indices, samples):
-    """
-    Evaluate a multivariate monomial basis at a set of samples.
-
-    Parameters
-    ----------
-    indices : np.ndarray (num_vars, num_indices)
-        The exponents of each monomial term
-
-    samples : np.ndarray (num_vars, num_samples)
-        Samples at which to evaluate the monomial
-
-    Return
-    ------
-    basis_matrix : np.ndarray (num_samples, num_indices)
-        The values of the monomial basis at the samples
-    """
-    num_vars, num_indices = indices.shape
-    assert samples.shape[0] == num_vars
-    num_samples = samples.shape[1]
-
-    deriv_order = 0
-    basis_matrix = empty(
-        ((1+deriv_order*num_vars)*num_samples, num_indices))
-    basis_vals_1d = [univariate_monomial_basis_matrix(
-        indices[0, :].max(), samples[0, :])]
-    basis_matrix[:num_samples, :] = basis_vals_1d[0][:, indices[0, :]]
-    for dd in range(1, num_vars):
-        basis_vals_1d.append(univariate_monomial_basis_matrix(
-            indices[dd, :].max(), samples[dd, :]))
-        basis_matrix[:num_samples, :] *= basis_vals_1d[dd][:, indices[dd, :]]
-    return basis_matrix
-
-
-class Monomial():
-    def __init__(self, nvars, degree, coefs, coef_bounds,
-                 transform=IdentityHyperParameterTransform(),
-                 name="MonomialCoefficients"):
-        self._nvars = nvars
-        self.degree = degree
-        self.indices = compute_hyperbolic_indices(self.nvars(), self.degree)
-        self.nterms = self.indices.shape[1]
-        self._coef = HyperParameter(
-            name, self.nterms, coefs, coef_bounds, transform)
-        self.hyp_list = HyperParameterList([self._coef])
-
-    def nvars(self):
-        return self._nvars
-
-    def basis_matrix(self, samples):
-        return monomial_basis_matrix(self.indices, asarray(samples))
-
-    def __call__(self, samples):
-        if self.degree == 0:
-            vals = empty((samples.shape[1], 1))
-            vals[:] = self._coef.get_values()
-            return vals
-        basis_mat = self.basis_matrix(samples)
-        vals = basis_mat @ self._coef.get_values()
-        return asarray(vals[:, None])
-
-    def __repr__(self):
-        return "{0}(name={1}, nvars={2}, degree={3}, nterms={4})".format(
-            self.__class__.__name__, self._coef.name, self.nvars(),
-            self.degree, self.nterms)
-
-
-class PeriodicMaternKernel(MaternKernel):
-    def __init__(self,
-                 nu: float,
-                 period: Union[float, array],
-                 period_bounds: array,
-                 lenscale: Union[float, array],
-                 lenscale_bounds: array):
-        super().__init__(nu, lenscale, lenscale_bounds, 1)
-        self._period = HyperParameter(
-            "period", 1, lenscale, lenscale_bounds,
-            LogHyperParameterTransform())
-        self.hyp_list += HyperParameterList([self._period])
-
-    def __call__(self, X, Y=None):
-        X = asarray(X)
-        if Y is None:
-            Y = X
-        else:
-            Y = asarray(Y)
-        lenscale = self._lenscale.get_values()
-        period = self._period.get_values()
-        distances = cdist(X.T/period, Y.T/period)/lenscale
-        return super()._eval_distance_form(distances)
-
-    def diag(self, X):
-        return super().diag(X)
diff --git a/pyapprox/surrogates/autogp/mokernels.py b/pyapprox/surrogates/autogp/mokernels.py
index 1dc9c86e..46a02988 100644
--- a/pyapprox/surrogates/autogp/mokernels.py
+++ b/pyapprox/surrogates/autogp/mokernels.py
@@ -1,14 +1,7 @@
 from abc import abstractmethod
 import numpy as np
 
-from pyapprox.surrogates.autogp.kernels import Kernel
-from pyapprox.surrogates.autogp._torch_wrappers import (
-    full, asarray, hstack, vstack, cholesky, solve_triangular, multidot,
-    cos, to_numpy, atleast1d, repeat, empty, log)
-from pyapprox.surrogates.autogp.hyperparameter import (
-    HyperParameter, HyperParameterList, IdentityHyperParameterTransform)
-from pyapprox.surrogates.autogp.transforms import (
-    SphericalCorrelationTransform)
+from pyapprox.surrogates.kernels._kernels import Kernel, SphericalCovariance
 
 
 class MultiOutputKernel(Kernel):
@@ -21,6 +14,11 @@ def __init__(self, kernels, noutputs):
         self.nsamples_per_output_0 = None
         self.nsamples_per_output_1 = None
 
+        # make linear algebra functions accessible via product_kernel._la_
+        for attr in dir(kernels[0]):
+            if len(attr) >= 4 and attr[:4] == "_la_":
+                setattr(self, attr, getattr(self.kernels[0], attr))
+
     @abstractmethod
     def _scale_block(self, samples_per_output_ii, ii,
                      samples_per_output_jj, jj, kk, symmetric):
@@ -45,8 +43,8 @@ def _evaluate_block(self, samples_per_output_ii, ii,
         if not block_format:
             if nonzero:
                 return block
-            return full((samples_per_output_ii.shape[1],
-                         samples_per_output_jj.shape[1]), 0.)
+            return self._la_full((samples_per_output_ii.shape[1],
+                                  samples_per_output_jj.shape[1]), 0.)
         if nonzero:
             return block
         return None
@@ -59,7 +57,7 @@ def __call__(self, samples_0, samples_1=None, block_format=False):
             only return upper-traingular blocks, and set lower-triangular
             blocks to None
         """
-        samples_0 = [asarray(s) for s in samples_0]
+        samples_0 = [s for s in samples_0]
         if samples_1 is None:
             samples_1 = samples_0
             symmetric = True
@@ -81,12 +79,13 @@ def __call__(self, samples_0, samples_1=None, block_format=False):
                     samples_0[idx0], idx0, samples_1[idx1], idx1,
                     block_format, symmetric)
         if not block_format:
-            rows = [hstack(matrix_blocks[ii]) for ii in range(noutputs_0)]
-            return vstack(rows)
+            rows = [self._la_hstack(matrix_blocks[ii])
+                    for ii in range(noutputs_0)]
+            return self._la_vstack(rows)
         return matrix_blocks
 
     def diag(self, samples_0):
-        samples_0 = [asarray(s) for s in samples_0]
+        # samples_0 = [asarray(s) for s in samples_0]
         nsamples_0 = np.asarray([s.shape[1] for s in samples_0])
         active_outputs_0 = np.where(nsamples_0 > 0)[0]
         noutputs_0 = active_outputs_0.shape[0]
@@ -99,7 +98,7 @@ def diag(self, samples_0):
                 if diag_iikk is not None:
                     diag_ii += diag_iikk
             diags.append(diag_ii)
-        return hstack(diags)
+        return self._la_hstack(diags)
 
     def __repr__(self):
         if self.nsamples_per_output_0 is None:
@@ -149,25 +148,6 @@ def _scale_diag(self, samples_per_output_ii, ii, kk):
         return None
 
 
-def _block_cholesky(L_A, L_A_inv_B, B, D, return_blocks):
-    schur_comp = D-multidot((L_A_inv_B.T, L_A_inv_B))
-    L_S = cholesky(schur_comp)
-    chol_blocks = [L_A, L_A_inv_B.T, L_S]
-    if return_blocks:
-        return chol_blocks
-    return vstack([
-        hstack([chol_blocks[0], 0*L_A_inv_B]),
-        hstack([chol_blocks[1], chol_blocks[2]])])
-
-
-def block_cholesky(blocks, return_blocks=False):
-    A, B = blocks[0]
-    D = blocks[1][1]
-    L_A = cholesky(A)
-    L_A_inv_B = solve_triangular(L_A, B)
-    return _block_cholesky(L_A, L_A_inv_B, B, D, return_blocks)
-
-
 class MultiPeerKernel(SpatiallyScaledMultiOutputKernel):
     def _validate_kernels_and_scalings(self, kernels, scalings):
         if len(scalings) != len(kernels)-1:
@@ -180,40 +160,42 @@ def _get_kernel_combination_matrix_entry(self, samples, ii, kk):
         if ii == self.noutputs-1:
             if kk < self.noutputs-1:
                 return self.scalings[kk](samples)
-            return full((samples.shape[1], 1), 1.)
+            return self._la_full((samples.shape[1], 1), 1.)
         if ii == kk:
-            return full((samples.shape[1], 1), 1.)
+            return self._la_full((samples.shape[1], 1), 1.)
         return None
 
     @staticmethod
-    def _cholesky(noutputs, blocks, block_format=False):
+    def _cholesky(noutputs, blocks, block_format=False, la=None):
         chol_blocks = []
         L_A_inv_B_list = []
         for ii in range(noutputs-1):
             row = [None for ii in range(noutputs)]
             for jj in range(noutputs):
                 if jj == ii:
-                    row[ii] = cholesky(blocks[ii][ii])
+                    row[ii] = la._la_cholesky(blocks[ii][ii])
                 elif not block_format:
-                    row[jj] = full(
+                    row[jj] = la._la_full(
                         (blocks[ii][ii].shape[0],
                          blocks[jj][noutputs-1].shape[0]), 0.)
             chol_blocks.append(row)
-            L_A_inv_B_list.append(solve_triangular(row[ii], blocks[ii][-1]))
-        B = vstack([blocks[jj][-1] for jj in range(noutputs-1)]).T
+            L_A_inv_B_list.append(
+                la._la_solve_triangular(row[ii], blocks[ii][-1]))
+        B = la._la_vstack([blocks[jj][-1] for jj in range(noutputs-1)]).T
         D = blocks[-1][-1]
-        L_A_inv_B = vstack(L_A_inv_B_list)
+        L_A_inv_B = la._la_vstack(L_A_inv_B_list)
         if not block_format:
-            L_A = vstack([hstack(row[:-1]) for row in chol_blocks])
-            return _block_cholesky(
+            L_A = la._la_vstack(
+                [la._la_hstack(row[:-1]) for row in chol_blocks])
+            return la._la_block_cholesky_engine(
                 L_A, L_A_inv_B, B, D, block_format)
-        return _block_cholesky(
+        return la._la_block_cholesky_engine(
                 chol_blocks, L_A_inv_B, B, D, block_format)
 
     @staticmethod
-    def _cholesky_blocks_to_dense(A, C, D):
+    def _cholesky_blocks_to_dense(A, C, D, la):
         shape = sum([A[ii][ii].shape[0] for ii in range(len(A))])
-        L = np.zeros((shape+C.shape[0], shape+D.shape[1]))
+        L = la._la_full((shape+C.shape[0], shape+D.shape[1]), 0.)
         cnt = 0
         for ii in range(len(A)):
             L[cnt:cnt+A[ii][ii].shape[0], cnt:cnt+A[ii][ii].shape[0]] = (
@@ -224,53 +206,54 @@ def _cholesky_blocks_to_dense(A, C, D):
         return L
 
     @staticmethod
-    def _logdet(A, C, D):
+    def _logdet(A, C, D, la):
         log_det = 0
         for ii, row in enumerate(A):
-            log_det += 2*log(row[ii].diag()).sum()
-        log_det += 2*log(D.diag()).sum()
+            log_det += 2*la._la_log(la._la_get_diagonal(row[ii])).sum()
+        log_det += 2*la._la_log(la._la_get_diagonal(D)).sum()
         return log_det
 
     @staticmethod
-    def _lower_solve_triangular(A, C, D, values):
+    def _lower_solve_triangular(A, C, D, values, la):
         # Solve Lx=y when L is the cholesky factor
         # of a peer kernel
         coefs = []
         cnt = 0
         for ii, row in enumerate(A):
             coefs.append(
-                solve_triangular(
-                    row[ii], values[cnt:cnt+row[ii].shape[0]], upper=False))
+                la._la_solve_triangular(
+                    row[ii], values[cnt:cnt+row[ii].shape[0]], lower=True))
             cnt += row[ii].shape[0]
-        coefs = vstack(coefs)
-        coefs = vstack(
-            (coefs, solve_triangular(D,  values[cnt:]-C@coefs, upper=False)))
+        coefs = la._la_vstack(coefs)
+        coefs = la._la_vstack(
+            (coefs, la._la_solve_triangular(
+                D,  values[cnt:]-C@coefs, lower=True)))
         return coefs
 
     @staticmethod
-    def _upper_solve_triangular(A, C, D, values):
+    def _upper_solve_triangular(A, C, D, values, la):
         # Solve L^Tx=y when L is the cholesky factor
         # of a peer kernel.
         # A, C, D all are from lower-triangular factor L (not L^T)
         # so must take transpose of all blocks
         idx1 = values.shape[0]
         idx0 = idx1 - D.shape[1]
-        coefs = [solve_triangular(D.T, values[idx0:idx1], upper=True)]
+        coefs = [la._la_solve_triangular(D.T, values[idx0:idx1], lower=False)]
         for ii, row in reversed(list(enumerate(A))):
             idx1 = idx0
             idx0 -= row[ii].shape[1]
             C_sub = C[:, idx0:idx1]
             coefs = (
-                [solve_triangular(
+                [la._la_solve_triangular(
                     row[ii].T, values[idx0:idx1]-C_sub.T @ coefs[-1],
-                    upper=True)] + coefs)
-        coefs = vstack(coefs)
+                    lower=False)] + coefs)
+        coefs = la._la_vstack(coefs)
         return coefs
 
     @staticmethod
-    def _cholesky_solve(A, C, D, values):
-        gamma = MultiPeerKernel._lower_solve_triangular(A, C, D, values)
-        return MultiPeerKernel._upper_solve_triangular(A, C, D, gamma)
+    def _cholesky_solve(A, C, D, values, la):
+        gamma = MultiPeerKernel._lower_solve_triangular(A, C, D, values, la)
+        return MultiPeerKernel._upper_solve_triangular(A, C, D, gamma, la)
 
 
 class MultiLevelKernel(SpatiallyScaledMultiOutputKernel):
@@ -283,7 +266,7 @@ def _validate_kernels_and_scalings(self, kernels, scalings):
 
     def _get_kernel_combination_matrix_entry(self, samples, ii, kk):
         if ii == kk:
-            return full((samples.shape[1], 1), 1.)
+            return self._la_full((samples.shape[1], 1), 1.)
         if ii < kk:
             return None
         val = self.scalings[kk](samples)
@@ -339,7 +322,7 @@ def get_output_kernel_correlations_from_psi(self, kk):
         """
         hyp_values = self.output_kernels[kk].hyp_list.get_values()
         psi = self.output_kernels[kk]._trans.map_theta_to_spherical(hyp_values)
-        return cos(psi[1:, 1])
+        return self._la_cos(psi[1:, 1])
 
 
 class ICMKernel(LMCKernel):
@@ -350,126 +333,6 @@ def __init__(self, latent_kernel, output_kernel, noutputs):
         super().__init__([latent_kernel], [output_kernel], noutputs)
 
 
-class CombinedHyperParameter(HyperParameter):
-    # Some times it is more intuitive for the user to pass to seperate
-    # hyperparameters but the code requires them to be treated
-    # as a single hyperparameter, e.g. when set_active_opt_params
-    # that requires both user hyperparameters must trigger an action
-    # like updating of an internal variable not common to all hyperparameter
-    # classes
-    def __init__(self, hyper_params: list):
-        self.hyper_params = hyper_params
-        self.bounds = vstack([hyp.bounds for hyp in self.hyper_params])
-
-    def nvars(self):
-        return sum([hyp.nvars() for hyp in self.hyper_params])
-
-    def nactive_vars(self):
-        return sum([hyp.nactive_vars() for hyp in self.hyper_params])
-
-    def set_active_opt_params(self, active_params):
-        cnt = 0
-        for hyp in self.hyper_params:
-            hyp.set_active_opt_params(
-                active_params[cnt:cnt+hyp.nactive_vars()])
-            cnt += hyp.nactive_vars()
-
-    def get_active_opt_params(self):
-        return hstack(
-            [hyp.get_active_opt_params() for hyp in self.hyper_params])
-
-    def get_active_opt_bounds(self):
-        return vstack(
-            [hyp.get_active_opt_bounds() for hyp in self.hyper_params])
-
-    def get_values(self):
-        return hstack([hyp.get_values() for hyp in self.hyper_params])
-
-    def set_values(self, values):
-        cnt = 0
-        for hyp in self.hyper_params:
-            hyp.set_values(values[cnt:cnt+hyp.nvars()])
-            cnt += hyp.nvars()
-
-
-class SphericalCovarianceHyperParameter(CombinedHyperParameter):
-    def __init__(self, hyper_params: list):
-        super().__init__(hyper_params)
-        self.cov_matrix = None
-        self.name = "spherical_covariance"
-        self.transform = IdentityHyperParameterTransform()
-        noutputs = hyper_params[0].nvars()
-        self._trans = SphericalCorrelationTransform(noutputs)
-        self._set_covariance_matrix()
-
-    def _set_covariance_matrix(self):
-        L = self._trans.map_to_cholesky(self.get_values())
-        self.cov_matrix = L@L.T
-
-    def set_active_opt_params(self, active_params):
-        super().set_active_opt_params(active_params)
-        self._set_covariance_matrix()
-
-    def __repr__(self):
-        return "{0}(name={1}, nvars={2}, transform={3}, nactive={4})".format(
-            self.__class__.__name__, self.name, self.nvars(), self.transform,
-            self.nactive_vars())
-
-
-class SphericalCovariance():
-    def __init__(self, noutputs, radii=1, radii_bounds=[1e-1, 1],
-                 angles=np.pi/2, angle_bounds=[0, np.pi],
-                 radii_transform=IdentityHyperParameterTransform(),
-                 angle_transform=IdentityHyperParameterTransform()):
-        # Angle bounds close to zero can create zero on the digaonal
-        # E.g. for speherical coordinates sin(0) = 0
-        self.noutputs = noutputs
-        self._trans = SphericalCorrelationTransform(self.noutputs)
-        self._validate_bounds(radii_bounds, angle_bounds)
-        self._radii = HyperParameter(
-            "radii", self.noutputs, radii, radii_bounds, radii_transform)
-        self._angles = HyperParameter(
-            "angles", self._trans.ntheta-self.noutputs, angles, angle_bounds,
-            angle_transform)
-        self.hyp_list = HyperParameterList([SphericalCovarianceHyperParameter(
-            [self._radii, self._angles])])
-
-    def _validate_bounds(self, radii_bounds, angle_bounds):
-        bounds = asarray(self._trans.get_spherical_bounds())
-        # all theoretical radii_bounds are the same so just check one
-        radii_bounds = atleast1d(radii_bounds)
-        if radii_bounds.shape[0] == 2:
-            radii_bounds = repeat(radii_bounds, self.noutputs)
-        radii_bounds = radii_bounds.reshape((radii_bounds.shape[0]//2, 2))
-        if (np.any(to_numpy(radii_bounds[:, 0] < bounds[:self.noutputs, 0])) or
-                np.any(to_numpy(
-                    radii_bounds[:, 1] > bounds[:self.noutputs, 1]))):
-            raise ValueError("radii bounds are inconsistent")
-        # all theoretical angle_bounds are the same so just check one
-        angle_bounds = atleast1d(angle_bounds)
-        if angle_bounds.shape[0] == 2:
-            angle_bounds = repeat(
-                angle_bounds, self._trans.ntheta-self.noutputs)
-        angle_bounds = angle_bounds.reshape((angle_bounds.shape[0]//2, 2))
-        if (np.any(to_numpy(angle_bounds[:, 0] < bounds[self.noutputs:, 0])) or
-                np.any(to_numpy(
-                    angle_bounds[:, 1] > bounds[self.noutputs:, 1]))):
-            raise ValueError("angle bounds are inconsistent")
-
-    def get_covariance_matrix(self):
-        return self.hyp_list.hyper_params[0].cov_matrix
-
-    def __call__(self, ii, jj):
-        # chol factor must be recomputed each time even if hyp_values have not
-        # changed otherwise gradient graph becomes inconsistent
-        return self.hyp_list.hyper_params[0].cov_matrix[ii, jj]
-
-    def __repr__(self):
-        return "{0}(radii={1}, angles={2} cov={3})".format(
-            self.__class__.__name__, self._radii, self._angles,
-            self.get_covariance_matrix().detach().numpy())
-
-
 class CollaborativeKernel(LMCKernel):
     def __init__(self, latent_kernels, output_kernels, discrepancy_kernels,
                  noutputs):
diff --git a/pyapprox/surrogates/autogp/numpytrends.py b/pyapprox/surrogates/autogp/numpytrends.py
new file mode 100644
index 00000000..34c2cec5
--- /dev/null
+++ b/pyapprox/surrogates/autogp/numpytrends.py
@@ -0,0 +1,14 @@
+from pyapprox.util.linearalgebra.numpylinalg import NumpyLinAlgMixin
+from pyapprox.util.hyperparameter.numpyhyperparameter import (
+    NumpyHyperParameter, NumpyHyperParameterList,
+    NumpyIdentityHyperParameterTransform)
+from pyapprox.surrogates.autogp.trends import Monomial
+
+
+class NumpyMonomial(Monomial, NumpyLinAlgMixin):
+    def __init__(self, nvars, degree, coefs, coef_bounds,
+                 name="MonomialCoefficients"):
+        self._HyperParameter = NumpyHyperParameter
+        self._HyperParameterList = NumpyHyperParameterList
+        transform = NumpyIdentityHyperParameterTransform()
+        super().__init__(nvars, degree, coefs, coef_bounds, transform, name)
diff --git a/pyapprox/surrogates/autogp/tests/test_gaussian_process.py b/pyapprox/surrogates/autogp/tests/test_gaussian_process.py
index 336f0b59..b7f0f435 100644
--- a/pyapprox/surrogates/autogp/tests/test_gaussian_process.py
+++ b/pyapprox/surrogates/autogp/tests/test_gaussian_process.py
@@ -1,23 +1,29 @@
 import unittest
-import numpy as np
 from functools import partial
 
+import numpy as np
+from scipy import stats
+from torch.distributions import MultivariateNormal as TorchMultivariateNormal
+
 from pyapprox.util.utilities import check_gradients
-from pyapprox.surrogates.autogp.kernels import (
-    MaternKernel, Monomial, ConstantKernel, GaussianNoiseKernel)
+from pyapprox.util.linearalgebra.numpylinalg import NumpyLinAlgMixin
+from pyapprox.util.linearalgebra.torchlinalg import TorchLinAlgMixin
+from pyapprox.surrogates.autogp.torchtrends import TorchMonomial
+from pyapprox.surrogates.kernels.torchkernels import (
+    TorchMaternKernel, TorchConstantKernel, TorchGaussianNoiseKernel,
+    TorchSphericalCovariance)
 from pyapprox.surrogates.autogp.mokernels import (
-    SphericalCovariance, ICMKernel, MultiPeerKernel, CollaborativeKernel)
-from pyapprox.surrogates.autogp.hyperparameter import (
-    LogHyperParameterTransform, HyperParameter)
-from pyapprox.surrogates.autogp.exactgp import (
-    ExactGaussianProcess, MOExactGaussianProcess, MOPeerExactGaussianProcess,
-    MOICMPeerExactGaussianProcess)
+    ICMKernel, MultiPeerKernel, CollaborativeKernel)
+from pyapprox.util.hyperparameter.torchhyperparameter import (
+    TorchLogHyperParameterTransform, TorchHyperParameter)
+from pyapprox.surrogates.autogp.torchgp import (
+    TorchExactGaussianProcess, TorchInducingGaussianProcess,
+    TorchInducingSamples, TorchMOExactGaussianProcess,
+    TorchMOPeerExactGaussianProcess, TorchMOICMPeerExactGaussianProcess)
 from pyapprox.surrogates.autogp.variationalgp import (
-    InducingGaussianProcess, InducingSamples,
     _log_prob_gaussian_with_noisy_nystrom_covariance)
-from pyapprox.surrogates.autogp.transforms import (
-    IdentityValuesTransform, StandardDeviationValuesTransform)
-from pyapprox.surrogates.autogp._torch_wrappers import asarray
+from pyapprox.util.transforms.torchtransforms import (
+    TorchIdentityTransform, TorchStandardDeviationTransform)
 
 
 class TestGaussianProcess(unittest.TestCase):
@@ -25,42 +31,42 @@ def setUp(self):
         np.random.seed(1)
         pass
 
-    def _check_invert_noisy_low_rank_nystrom_approximation(self, N, M):
+    def _check_invert_noisy_low_rank_nystrom_approximation(
+            self, N, M, la, MultivariateNormal):
         noise_std = 2
-        tmp = np.random.normal(0, 1, (N, N))
+        tmp = la._la_atleast2d(np.random.normal(0, 1, (N, N)))
         C_NN = tmp.T@tmp
         C_MN = C_NN[:M]
         C_MM = C_NN[:M, :M]
-        Q = asarray(
-            C_MN.T @ np.linalg.inv(C_MM) @ C_MN + noise_std**2*np.eye(N))
+        Q = (
+            C_MN.T @ la._la_inv(C_MM) @ C_MN + noise_std**2*la._la_eye(N))
 
-        values = asarray(np.ones((N, 1)))
-        from torch.distributions import MultivariateNormal
+        values = la._la_full((N, 1), 1)
         p_y = MultivariateNormal(values[:, 0]*0, covariance_matrix=Q)
         logpdf1 = p_y.log_prob(values[:, 0])
 
-        L_UU = asarray(np.linalg.cholesky(C_MM))
+        L_UU = la._la_cholesky(C_MM)
         logpdf2 = _log_prob_gaussian_with_noisy_nystrom_covariance(
-            asarray(noise_std), L_UU, asarray(C_MN.T), values)
+            noise_std, L_UU, C_MN.T, values, la)
         assert np.allclose(logpdf1, logpdf2)
 
         if N != M:
             return
 
-        assert np.allclose(Q, C_NN + noise_std**2*np.eye(N))
+        assert np.allclose(Q, C_NN + noise_std**2*la._la_eye(N))
 
-        values = values.numpy()
-        Q_inv = np.linalg.inv(Q)
+        values = values
+        Q_inv = la._la_inv(Q)
 
-        import scipy
-        Delta = scipy.linalg.solve_triangular(
+        Delta = la._la_solve_triangular(
             L_UU, C_MN.T, lower=True)/noise_std
-        Omega = np.eye(M) + Delta@Delta.T
-        L_Omega = np.linalg.cholesky(Omega)
-        log_det = 2*np.log(np.diag(L_Omega)).sum()+2*N*np.log(noise_std)
-        gamma = scipy.linalg.solve_triangular(
+        Omega = la._la_eye(M) + Delta@Delta.T
+        L_Omega = la._la_cholesky(Omega)
+        log_det = (2*la._la_log(la._la_get_diagonal(L_Omega)).sum() +
+                   2*N*np.log(noise_std))
+        gamma = la._la_solve_triangular(
             L_Omega, Delta @ values, lower=True)
-        assert np.allclose(log_det, np.linalg.slogdet(Q)[1])
+        assert np.allclose(log_det, la._la_slogdet(Q)[1])
 
         coef = Q_inv @ values
         assert np.allclose(
@@ -69,19 +75,36 @@ def _check_invert_noisy_low_rank_nystrom_approximation(self, N, M):
 
         mll = -0.5 * (
             values.T@coef +
-            np.linalg.slogdet(Q)[1] +
+            la._la_slogdet(Q)[1] +
             N*np.log(2*np.pi)
         )
         assert np.allclose(mll, logpdf2)
 
     def test_invert_noisy_low_rank_nystrom_approximation(self):
+        # set multivariatenormal for scipy to have same api as torch
+        class NumpyMultivariateNormal():
+            def __init__(self, mean, covariance_matrix):
+                self._mvn = stats.multivariate_normal(mean, covariance_matrix)
+
+            def log_prob(self, xx):
+                return self._mvn.logpdf(xx)
+
         test_cases = [
-            [3, 2], [4, 2], [15, 6], [3, 3]]
-        for test_case in test_cases[-1:]:
+            [3, 2, NumpyLinAlgMixin(), NumpyMultivariateNormal],
+            [4, 2, NumpyLinAlgMixin(), NumpyMultivariateNormal],
+            [15, 6, NumpyLinAlgMixin(), NumpyMultivariateNormal],
+            [3, 3, NumpyLinAlgMixin(), NumpyMultivariateNormal],
+            [3, 2, TorchLinAlgMixin(), TorchMultivariateNormal],
+            [4, 2, TorchLinAlgMixin(), TorchMultivariateNormal],
+            [15, 6, TorchLinAlgMixin(), TorchMultivariateNormal],
+            [3, 3, TorchLinAlgMixin(), TorchMultivariateNormal]]
+        for test_case in test_cases:
             np.random.seed(1)
             self._check_invert_noisy_low_rank_nystrom_approximation(*test_case)
 
-    def _check_exact_gp_training(self, mean, values_trans, constant):
+    def _check_exact_gp_training(
+            self, mean, values_trans, constant, ConstantKernel, MaternKernel,
+            LogHyperParameterTransform, ExactGaussianProcess):
         nvars = 1
         if mean is not None:
             assert mean.nvars() == nvars
@@ -101,7 +124,7 @@ def fun(xx):
             return (xx**2).sum(axis=0)[:, None]
 
         ntrain_samples = 10
-        train_samples = np.linspace(-1, 1, ntrain_samples)[None, :]
+        train_samples = kernel._la_linspace(-1, 1, ntrain_samples)[None, :]
         train_values = fun(train_samples)
 
         gp.set_training_data(train_samples, train_values)
@@ -111,47 +134,53 @@ def fun(xx):
         errors = check_gradients(
             lambda x: gp._fit_objective(x[:, 0]), True, x0[:, None],
             disp=False)
+        # print(errors.min()/errors.max())
         assert errors.min()/errors.max() < 1e-6
 
         gp.fit(train_samples, train_values)
 
         ntest_samples = 5
-        test_samples = np.random.uniform(-1, 1, (nvars, ntest_samples))
+        test_samples = kernel._la_atleast2d(
+            np.random.uniform(-1, 1, (nvars, ntest_samples)))
         test_vals = fun(test_samples)
 
         gp_vals, gp_std = gp(test_samples, return_std=True)
 
         if mean is not None and mean.degree == 2:
             assert np.allclose(gp_vals, test_vals, atol=1e-14)
-            xx = np.linspace(-1, 1, 101)[None, :]
+            xx = kernel._la_linspace(-1, 1, 101)[None, :]
             assert np.allclose(gp.values_trans.map_from_canonical(
-                gp._canonical_mean(xx)), fun(xx), atol=5e-6)
+                gp._canonical_mean(xx)), fun(xx), atol=6e-5)
         else:
             assert np.allclose(gp_vals, test_vals, atol=1e-2)
 
     def test_exact_gp_training(self):
         test_cases = [
-            [None, IdentityValuesTransform(), None],
-            [Monomial(1, 2, 1.0, (-1e3, 1e3), name='mean'),
-             IdentityValuesTransform(), None],
-            [None, StandardDeviationValuesTransform(), None],
-            [Monomial(1, 2, 1.0, (-1e3, 1e3), name='mean'),
-             StandardDeviationValuesTransform(), None],
+            [None, TorchIdentityTransform(), None],
+            [TorchMonomial(1, 2, 1.0, (-1e3, 1e3), name='mean'),
+             TorchIdentityTransform(), None],
+            [None, TorchStandardDeviationTransform(trans=True), None],
+            [TorchMonomial(1, 2, 1.0, (-1e3, 1e3), name='mean'),
+             TorchStandardDeviationTransform(trans=True), None],
         ]
+        torch_classes = [
+            TorchConstantKernel, TorchMaternKernel,
+            TorchLogHyperParameterTransform, TorchExactGaussianProcess]
         for test_case in test_cases:
-            self._check_exact_gp_training(*test_case)
+            print(test_case)
+            self._check_exact_gp_training(*(test_case+torch_classes))
 
     def test_compare_with_deprecated_gp(self):
         nvars = 1
         noise = 0.0 #1
         sigma = 1
         lenscale = 0.5
-        kernel = (ConstantKernel(sigma, [np.nan, np.nan]) *
-                  MaternKernel(np.inf, lenscale, [np.nan, np.nan], nvars) +
-                  GaussianNoiseKernel(noise, [np.nan, np.nan]))
+        kernel = (TorchConstantKernel(sigma, [np.nan, np.nan]) *
+                  TorchMaternKernel(np.inf, lenscale, [np.nan, np.nan], nvars) +
+                  TorchGaussianNoiseKernel(noise, [np.nan, np.nan]))
 
-        gp = ExactGaussianProcess(
-            nvars, kernel, mean=None, values_trans=IdentityValuesTransform())
+        gp = TorchExactGaussianProcess(
+            nvars, kernel, mean=None, values_trans=TorchIdentityTransform())
 
         # def fun(xx):
         #     return (xx**2).sum(axis=0)[:, None]
@@ -165,6 +194,8 @@ def fun(xx, noisy=True):
         ntrain_samples = 6
         train_samples = np.linspace(-1, 1, ntrain_samples)[None, :]
         train_values = fun(train_samples)
+        torch_train_samples = kernel._la_atleast2d(train_samples)
+        torch_train_values = kernel._la_atleast2d(train_values)
 
         from pyapprox.surrogates.gaussianprocess.gaussian_process import (
             GaussianProcess, Matern,  ConstantKernel as CKernel, WhiteKernel)
@@ -172,9 +203,10 @@ def fun(xx, noisy=True):
                      Matern(lenscale, length_scale_bounds='fixed', nu=np.inf) +
                      WhiteKernel(noise, 'fixed'))
 
-        assert np.allclose(kernel(train_samples), pyakernel(train_samples.T))
+        assert np.allclose(kernel(torch_train_samples),
+                           pyakernel(torch_train_samples.T))
 
-        gp.fit(train_samples, train_values)
+        gp.fit(torch_train_samples, torch_train_values)
 
         pyagp = GaussianProcess(pyakernel, alpha=0.)
         pyagp.fit(train_samples, train_values)
@@ -202,22 +234,22 @@ def fun(xx, noisy=True):
     def test_variational_gp_training(self):
         ntrain_samples = 10
         nvars, ninducing_samples = 1, 5
-        kernel = MaternKernel(np.inf, 0.5, [1e-1, 1], nvars)
+        kernel = TorchMaternKernel(np.inf, 0.5, [1e-1, 1], nvars)
         inducing_samples = np.linspace(-1, 1, ninducing_samples)[None, :]
-        noise = HyperParameter(
-            'noise', 1, 1, (1e-6, 1), LogHyperParameterTransform())
-        inducing_samples = InducingSamples(
+        noise = TorchHyperParameter(
+            'noise', 1, 1, (1e-6, 1), TorchLogHyperParameterTransform())
+        inducing_samples = TorchInducingSamples(
             nvars, ninducing_samples, inducing_samples=inducing_samples,
             noise=noise)
-        values_trans = IdentityValuesTransform()
-        gp = InducingGaussianProcess(
+        values_trans = TorchIdentityTransform()
+        gp = TorchInducingGaussianProcess(
             nvars, kernel, inducing_samples,
             kernel_reg=1e-10, values_trans=values_trans)
 
         def fun(xx):
             return (xx**2).sum(axis=0)[:, None]
 
-        train_samples = np.linspace(-1, 1, ntrain_samples)[None, :]
+        train_samples = kernel._la_linspace(-1, 1, ntrain_samples)[None, :]
         train_values = fun(train_samples)
 
         gp.set_training_data(train_samples, train_values)
@@ -247,7 +279,8 @@ def fun(xx):
         # plt.show()
 
         ntest_samples = 10
-        test_samples = np.random.uniform(-1, 1, (nvars, ntest_samples))
+        test_samples = kernel._la_atleast2d(
+            np.random.uniform(-1, 1, (nvars, ntest_samples)))
         test_vals = fun(test_samples)
         gp_mu, gp_std = gp(test_samples, return_std=True)
         # print(gp_mu-test_vals)
@@ -257,20 +290,21 @@ def test_variational_gp_collapse_to_exact_gp(self):
         nvars = 1
         ntrain_samples = 6
         noise_var = 1e-8
-        kernel = (MaternKernel(np.inf, 1, [1e-1, 1], nvars))
-        values_trans = IdentityValuesTransform()
+        kernel = (TorchMaternKernel(np.inf, 1, [1e-1, 1], nvars))
+        values_trans = TorchIdentityTransform()
 
         def fun(xx):
             return (xx**2).sum(axis=0)[:, None]
 
-        train_samples = np.linspace(-1, 1, ntrain_samples)[None, :]
+        train_samples = kernel._la_linspace(-1, 1, ntrain_samples)[None, :]
         train_values = fun(train_samples)
 
         ntest_samples = 6
         test_samples = np.random.uniform(-1, 1, (nvars, ntest_samples))
 
-        exact_gp = ExactGaussianProcess(
-            nvars, kernel+GaussianNoiseKernel(noise_var, [np.nan, np.nan]),
+        exact_gp = TorchExactGaussianProcess(
+            nvars,
+            kernel+TorchGaussianNoiseKernel(noise_var, [np.nan, np.nan]),
             mean=None, values_trans=values_trans, kernel_reg=0)
         exact_gp.set_training_data(train_samples, train_values)
         exact_gp.fit(train_samples, train_values, max_nglobal_opt_iters=1)
@@ -280,16 +314,17 @@ def fun(xx):
         ninducing_samples = ntrain_samples
         # fix hyperparameters so they are not changed from exact_gp
         # or setting provided if not found in exact_gp
-        noise = HyperParameter(
+        noise = TorchHyperParameter(
             'noise_std', 1, np.sqrt(noise_var), [np.nan, np.nan],
-            LogHyperParameterTransform())
-        inducing_samples = InducingSamples(
+            TorchLogHyperParameterTransform())
+        inducing_samples = TorchInducingSamples(
             nvars, ninducing_samples, inducing_samples=inducing_samples,
-            inducing_sample_bounds=[np.nan, np.nan], noise=noise)
-        values_trans = IdentityValuesTransform()
+            inducing_sample_bounds=kernel._la_atleast1d([np.nan, np.nan]),
+            noise=noise)
+        values_trans = TorchIdentityTransform()
         # use correlation length learnt by exact gp
         vi_kernel = kernel
-        vi_gp = InducingGaussianProcess(
+        vi_gp = TorchInducingGaussianProcess(
             nvars, vi_kernel, inducing_samples,
             kernel_reg=0, values_trans=values_trans)
         vi_gp.fit(train_samples, train_values, max_nglobal_opt_iters=1)
@@ -317,8 +352,8 @@ def fun1(xx):
 
         radii, radii_bounds = np.arange(1, noutputs+1), [1, 10]
         angles = np.pi/4
-        latent_kernel = MaternKernel(np.inf, 0.5, [1e-1, 2], nvars)
-        output_kernel = SphericalCovariance(
+        latent_kernel = TorchMaternKernel(np.inf, 0.5, [1e-1, 2], nvars)
+        output_kernel = TorchSphericalCovariance(
             noutputs, radii, radii_bounds, angles=angles,
             angle_bounds=[0, np.pi])
 
@@ -326,28 +361,29 @@ def fun1(xx):
 
         nsamples_per_output = [12, 12]
         samples_per_output = [
-            np.random.uniform(-1, 1, (nvars, nsamples))
+            kernel._la_atleast2d(np.random.uniform(-1, 1, (nvars, nsamples)))
             for nsamples in nsamples_per_output]
 
         values_per_output = [
             fun(samples) for fun, samples in zip(funs, samples_per_output)]
 
-        gp = MOExactGaussianProcess(
-            nvars, kernel, mean=None, values_trans=IdentityValuesTransform(),
+        gp = TorchMOExactGaussianProcess(
+            nvars, kernel, values_trans=TorchIdentityTransform(),
             kernel_reg=1e-8)
         gp.fit(samples_per_output, values_per_output, max_nglobal_opt_iters=3)
 
         # check correlation between models is estimated correctly.
         # SphericalCovariance is not guaranteed to recover the statistical
         # correlation, but for this case it can
-        from pyapprox.util.utilities import get_correlation_from_covariance
         cov_matrix = output_kernel.get_covariance_matrix()
-        corr_matrix = get_correlation_from_covariance(cov_matrix.numpy())
-        samples = np.random.uniform(-1, 1, (1, 101))
-        values = np.hstack([fun(samples) for fun in funs])
+        corr_matrix = kernel._la_get_correlation_from_covariance(
+            cov_matrix)
+        samples = kernel._la_atleast2d(np.random.uniform(-1, 1, (1, 101)))
+        values = kernel._la_hstack([fun(samples) for fun in funs])
         assert np.allclose(
             corr_matrix,
-            get_correlation_from_covariance(np.cov(values.T, ddof=1)),
+            kernel._la_get_correlation_from_covariance(
+                kernel._la_cov(values.T, ddof=1)),
             atol=1e-2)
 
         # import matplotlib.pyplot as plt
@@ -365,10 +401,10 @@ def fun1(xx):
     def test_peer_gaussian_process(self):
         nvars, noutputs = 1, 4
         degree = 0
-        kernels = [MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
+        kernels = [TorchMaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
                    for ii in range(noutputs)]
         scalings = [
-            Monomial(nvars, degree, 1, [-1, 2], name=f'scaling{ii}')
+            TorchMonomial(nvars, degree, 1, [-1, 2], name=f'scaling{ii}')
             for ii in range(noutputs-1)]
         kernel = MultiPeerKernel(kernels, scalings)
 
@@ -388,14 +424,14 @@ def target_fun(peer_funs, xx):
         # nsamples_per_output = np.array([5 for ii in range(noutputs-1)]+[4])*2
         nsamples_per_output = np.array([7 for ii in range(noutputs-1)]+[5])
         samples_per_output = [
-            np.random.uniform(-1, 1, (nvars, nsamples))
+            kernel._la_atleast2d(np.random.uniform(-1, 1, (nvars, nsamples)))
             for nsamples in nsamples_per_output]
 
         values_per_output = [
             fun(samples) for fun, samples in zip(funs, samples_per_output)]
 
-        gp = MOExactGaussianProcess(
-            nvars, kernel, mean=None, values_trans=IdentityValuesTransform(),
+        gp = TorchMOExactGaussianProcess(
+            nvars, kernel, values_trans=TorchIdentityTransform(),
             kernel_reg=0)
         gp.fit(samples_per_output, values_per_output, max_nglobal_opt_iters=3)
 
@@ -411,14 +447,14 @@ def target_fun(peer_funs, xx):
 
         # check that when using hyperparameters found by dense GP the PeerGP
         # return the same likelihood value and prediction mean and std. dev.
-        peer_gp = MOPeerExactGaussianProcess(
-            nvars, kernel, mean=None, values_trans=IdentityValuesTransform(),
+        peer_gp = TorchMOPeerExactGaussianProcess(
+            nvars, kernel, values_trans=TorchIdentityTransform(),
             kernel_reg=0)
         peer_gp.set_training_data(samples_per_output, values_per_output)
         assert np.allclose(
             gp._neg_log_likelihood_with_hyperparameter_mean(),
             peer_gp._neg_log_likelihood_with_hyperparameter_mean())
-        xx = np.linspace(-1, 1, 31)[None, :]
+        xx = kernel._la_linspace(-1, 1, 31)[None, :]
         gp_mean, gp_std = gp([xx]*noutputs, return_std=True)
         peer_gp_mean, peer_gp_std = peer_gp([xx]*noutputs, return_std=True)
         assert np.allclose(peer_gp_mean, gp_mean)
@@ -439,8 +475,8 @@ def target_fun(peer_funs, xx):
         # radii, radii_bounds = np.ones(noutputs), [1, 10]
         radii, radii_bounds = np.arange(1, 1+noutputs), [1, 10]
         angles = np.pi/2
-        latent_kernel = MaternKernel(np.inf, 0.5, [1e-1, 2], nvars)
-        output_kernel = SphericalCovariance(
+        latent_kernel = TorchMaternKernel(np.inf, 0.5, [1e-1, 2], nvars)
+        output_kernel = TorchSphericalCovariance(
             noutputs, radii, radii_bounds, angles=angles,
             angle_bounds=[0, np.pi])
 
@@ -454,15 +490,15 @@ def target_fun(peer_funs, xx):
         # nsamples_per_output = np.array([5 for ii in range(noutputs-1)]+[4])*2
         # nsamples_per_output = np.array([3 for ii in range(noutputs-1)]+[2])
         samples_per_output = [
-            np.random.uniform(-1, 1, (nvars, nsamples))
+            kernel._la_atleast2d(np.random.uniform(-1, 1, (nvars, nsamples)))
             for nsamples in nsamples_per_output]
 
         values_per_output = [
             fun(samples) for fun, samples in zip(funs, samples_per_output)]
 
-        gp = MOICMPeerExactGaussianProcess(
+        gp = TorchMOICMPeerExactGaussianProcess(
             nvars, kernel, output_kernel,
-            values_trans=IdentityValuesTransform(), kernel_reg=0)
+            values_trans=TorchIdentityTransform(), kernel_reg=0)
         gp_params = gp.hyp_list.get_active_opt_params()
 
         from pyapprox.util.utilities import check_gradients
@@ -492,7 +528,7 @@ def target_fun(peer_funs, xx):
         print(cov_matrix)
         for ii in range(2, noutputs):
             for jj in range(1, ii):
-                np.abs(cov_matrix[ii, jj]) < 1e-10
+                kernel._la_abs(cov_matrix[ii, jj]) < 1e-10
 
         # import matplotlib.pyplot as plt
         # axs = plt.subplots(
@@ -506,32 +542,34 @@ def target_fun(peer_funs, xx):
 
     def test_collaborative_gp(self):
         nvars, noutputs = 1, 4
-        def peer_fun(delta, xx):
-            return np.cos(2*np.pi*xx.T+delta)
-
-        def target_fun(peer_funs, xx):
-            return (
-                np.hstack([f(xx) for f in peer_funs]).sum(axis=1)[:, None] +
-                np.exp(-xx.T**2*2))
-            # return np.cos(2*np.pi*xx.T)
 
         radii, radii_bounds = np.ones(noutputs), [1, 2]
         angles = np.pi/4
-        latent_kernel = MaternKernel(np.inf, 0.5, [1e-1, 2], nvars)
-        output_kernel = SphericalCovariance(
+        latent_kernel = TorchMaternKernel(np.inf, 0.5, [1e-1, 2], nvars)
+        output_kernel = TorchSphericalCovariance(
             noutputs, radii, radii_bounds, angles=angles,
             angle_bounds=[0, np.pi])
 
         output_kernels = [output_kernel]
         latent_kernels = [latent_kernel]
         discrepancy_kernels = [
-            ConstantKernel(
-                0.1, (1e-1, 1), transform=LogHyperParameterTransform()) *
-            MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
+            TorchConstantKernel(
+                0.1, (1e-1, 1), transform=TorchLogHyperParameterTransform()) *
+            TorchMaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
             for ii in range(noutputs)]
         co_kernel = CollaborativeKernel(
             latent_kernels, output_kernels, discrepancy_kernels, noutputs)
 
+        def peer_fun(delta, xx):
+            return latent_kernel._la_cos(2*np.pi*xx.T+delta)
+
+        def target_fun(peer_funs, xx):
+            return (
+                latent_kernel._la_hstack(
+                    [f(xx) for f in peer_funs]).sum(axis=1)[:, None] +
+                latent_kernel._la_exp(-xx.T**2*2))
+            # return np.cos(2*np.pi*xx.T)
+
         peer_deltas = np.linspace(0.2, 1, noutputs-1)
         peer_funs = [partial(peer_fun, delta) for delta in peer_deltas]
         funs = peer_funs + [partial(target_fun, peer_funs)]
@@ -540,15 +578,16 @@ def target_fun(peer_funs, xx):
         # nsamples_per_output = np.array([5 for ii in range(noutputs-1)]+[4])*2
         # nsamples_per_output = np.array([3 for ii in range(noutputs-1)]+[2])
         samples_per_output = [
-            np.random.uniform(-1, 1, (nvars, nsamples))
+            latent_kernel._la_atleast2d(
+                np.random.uniform(-1, 1, (nvars, nsamples)))
             for nsamples in nsamples_per_output]
 
         values_per_output = [
             fun(samples) for fun, samples in zip(funs, samples_per_output)]
 
-        gp = MOExactGaussianProcess(
-            nvars, co_kernel, mean=None,
-            values_trans=IdentityValuesTransform(), kernel_reg=0)
+        gp = TorchMOExactGaussianProcess(
+            nvars, co_kernel,
+            values_trans=TorchIdentityTransform(), kernel_reg=0)
         gp_params = gp.hyp_list.get_active_opt_params()
 
         gp.set_training_data(samples_per_output, values_per_output)
diff --git a/pyapprox/surrogates/autogp/tests/test_kernels.py b/pyapprox/surrogates/autogp/tests/test_kernels.py
deleted file mode 100644
index 55f1e9f6..00000000
--- a/pyapprox/surrogates/autogp/tests/test_kernels.py
+++ /dev/null
@@ -1,87 +0,0 @@
-import unittest
-import numpy as np
-import torch
-
-from pyapprox.surrogates.autogp._torch_wrappers import log
-from pyapprox.surrogates.autogp.kernels import (
-    ConstantKernel, MaternKernel, PeriodicMaternKernel)
-
-
-def approx_jacobian_3D(f, x0, epsilon=np.sqrt(np.finfo(float).eps)):
-    fval = f(x0)
-    jacobian = np.zeros((fval.shape[0], fval.shape[1], x0.shape[0]))
-    for ii in range(len(x0)):
-        dx = np.full((x0.shape[0]), 0.)
-        dx[ii] = epsilon
-        fval_perturbed = f(x0+dx)
-        jacobian[..., ii] = (fval_perturbed - fval) / epsilon
-    return jacobian
-
-
-class TestKernels(unittest.TestCase):
-    def setUp(self):
-        np.random.seed(1)
-
-    def test_kernels(self):
-        kernel_inf = MaternKernel(np.inf, 1.0, [1e-1, 1], 2)
-        values = torch.as_tensor([0.5, 0.5], dtype=torch.double)
-        kernel_inf.hyp_list.set_active_opt_params(log(values))
-        assert np.allclose(kernel_inf.hyp_list.get_values(), values)
-
-        nsamples1, nsamples2 = 5, 3
-        X = np.random.normal(0, 1, (2, nsamples1))
-        Y = np.random.normal(0, 1, (2, nsamples2))
-        assert np.allclose(kernel_inf.diag(X), np.diag(kernel_inf(X, X)))
-
-        const0 = 2.0
-        kernel_prod = kernel_inf*ConstantKernel(const0)
-        assert np.allclose(kernel_prod.diag(X), const0*kernel_inf.diag(X))
-        assert np.allclose(kernel_prod.diag(X), np.diag(kernel_prod(X, X)))
-        assert np.allclose(kernel_prod(X, Y), const0*kernel_inf(X, Y))
-
-        const1 = 3.0
-        kernel_sum = kernel_prod+ConstantKernel(const1)
-        assert np.allclose(
-            kernel_sum.diag(X), const0*kernel_inf.diag(X)+const1)
-        assert np.allclose(kernel_sum.diag(X), np.diag(kernel_sum(X, X)))
-        assert np.allclose(kernel_sum(X, Y), const0*kernel_inf(X, Y)+const1)
-
-        kernel_periodic = PeriodicMaternKernel(
-            0.5, 1.0, [1e-1, 1], 1, [1e-1, 1])
-        values = torch.as_tensor([0.5, 0.5], dtype=torch.double)
-        kernel_periodic.hyp_list.set_active_opt_params(log(values))
-        assert np.allclose(kernel_periodic.hyp_list.get_values(), values)
-        assert np.allclose(
-            kernel_periodic.diag(X), np.diag(kernel_periodic(X, X)))
-
-    def check_kernel_jacobian(self, kernel, nsamples):
-        X = np.random.uniform(-1, 1, (kernel.nvars(), nsamples))
-
-        def fun(active_params_opt):
-            if not isinstance(active_params_opt, np.ndarray):
-                active_params_opt.requires_grad = True
-            else:
-                active_params_opt = torch.as_tensor(
-                    active_params_opt, dtype=torch.double)
-            kernel.hyp_list.set_active_opt_params(active_params_opt)
-            return kernel(X)
-
-        jacobian = torch.autograd.functional.jacobian(
-            fun, kernel.hyp_list.get_active_opt_params())
-        for hyp in kernel.hyp_list.hyper_params:
-            hyp._values = hyp._values.clone().detach()
-        assert np.allclose(
-            jacobian.numpy(),
-            approx_jacobian_3D(
-                fun, kernel.hyp_list.get_active_opt_params().detach().numpy()))
-
-    def test_kernel_jacobian(self):
-        nvars, nsamples = 2, 3
-        kernel = MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
-        self.check_kernel_jacobian(kernel, nsamples)
-
-
-if __name__ == "__main__":
-    kernels_test_suite = unittest.TestLoader().loadTestsFromTestCase(
-        TestKernels)
-    unittest.TextTestRunner(verbosity=2).run(kernels_test_suite)
diff --git a/pyapprox/surrogates/autogp/tests/test_mokernels.py b/pyapprox/surrogates/autogp/tests/test_mokernels.py
index 11416ade..074e4e74 100644
--- a/pyapprox/surrogates/autogp/tests/test_mokernels.py
+++ b/pyapprox/surrogates/autogp/tests/test_mokernels.py
@@ -2,19 +2,23 @@
 import numpy as np
 import scipy
 
-from pyapprox.surrogates.autogp.kernels import (
-    Monomial, MaternKernel, ConstantKernel)
+from pyapprox.surrogates.kernels.numpykernels import (
+    NumpyMaternKernel, NumpyConstantKernel, NumpySphericalCovariance)
+from pyapprox.surrogates.kernels.torchkernels import (
+    TorchMaternKernel, TorchSphericalCovariance)
+from pyapprox.surrogates.autogp.numpytrends import NumpyMonomial
+from pyapprox.surrogates.autogp.torchtrends import TorchMonomial
 from pyapprox.surrogates.autogp.mokernels import (
     MultiLevelKernel, MultiPeerKernel, _get_recursive_scaling_matrix,
-    SphericalCovariance, ICMKernel, CollaborativeKernel)
-from pyapprox.surrogates.autogp._torch_wrappers import asarray
+    ICMKernel, CollaborativeKernel)
 
 
 class TestMultiOutputKernels(unittest.TestCase):
     def setUp(self):
         np.random.seed(1)
 
-    def _check_multilevel_kernel_scaling_matrix(self, noutputs):
+    def _check_multilevel_kernel_scaling_matrix(self, noutputs, MaternKernel,
+                                                Monomial):
         nvars, degree = 1, 0
         kernels = [
             MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
@@ -38,16 +42,20 @@ def _check_multilevel_kernel_scaling_matrix(self, noutputs):
         assert np.allclose(W_true, W)
 
     def test_multilevel_kernel_scaling_matrix(self):
-        self._check_multilevel_kernel_scaling_matrix(2)
-        self._check_multilevel_kernel_scaling_matrix(3)
-        self._check_multilevel_kernel_scaling_matrix(4)
+        for kk in range(2, 5):
+            self._check_multilevel_kernel_scaling_matrix(
+                kk, NumpyMaternKernel, NumpyMonomial)
+        for kk in range(2, 5):
+            self._check_multilevel_kernel_scaling_matrix(
+                kk, TorchMaternKernel, TorchMonomial)
 
     def _check_spatially_scaled_multioutput_kernel_covariance(
             self, kernel, samples_per_output):
         nsamples_per_output = [s.shape[1] for s in samples_per_output]
         kmat = kernel(samples_per_output)
         assert np.allclose(kmat, kmat.T)
-        assert np.allclose(np.diag(kmat), kernel.diag(samples_per_output))
+        assert np.allclose(kernel._la_get_diagonal(kmat),
+                           kernel.diag(samples_per_output))
 
         # test evaluation when two sample sets are provided
         from copy import deepcopy
@@ -58,7 +66,8 @@ def _check_spatially_scaled_multioutput_kernel_covariance(
         cnt = sum([s.shape[1] for s in samples_per_output_test])
         assert np.allclose(kmat[:cnt, :], kmat_XY)
         kmat_diag = kernel.diag(samples_per_output_test)
-        assert np.allclose(kmat_diag, np.diag(kmat[:cnt, :cnt]))
+        assert np.allclose(
+            kmat_diag, kernel._la_get_diagonal(kmat[:cnt, :cnt]))
 
         samples_per_output_test = deepcopy(samples_per_output)
         samples_per_output_test[:1] = [np.array([[]])]
@@ -67,14 +76,17 @@ def _check_spatially_scaled_multioutput_kernel_covariance(
 
         kmat_diag = kernel.diag(samples_per_output_test)
         assert np.allclose(
-            kmat_diag, np.diag(kmat[samples_per_output[0].shape[1]:,
-                                    samples_per_output[0].shape[1]:]))
+            kmat_diag, kernel._la_get_diagonal(
+                kmat[samples_per_output[0].shape[1]:,
+                     samples_per_output[0].shape[1]:]))
 
         nsamples = int(5e6)
         DD_list_0 = [
-            np.linalg.cholesky(kernel.kernels[kk](samples_per_output[0])).dot(
-                np.random.normal(
-                    0, 1, (nsamples_per_output[0], nsamples)))
+            kernel._la_atleast2d(
+                np.linalg.cholesky(
+                    kernel.kernels[kk](samples_per_output[0])).dot(
+                        np.random.normal(
+                            0, 1, (nsamples_per_output[0], nsamples))))
             for kk in range(kernel.nkernels)]
         # samples must be nested for tests to work
         DD_lists = [[DD[:nsamples_per_output[ii], :] for DD in DD_list_0]
@@ -95,18 +107,20 @@ def _check_spatially_scaled_multioutput_kernel_covariance(
                     False, True),
                 rtol=1e-2)
             for jj in range(ii+1, kernel.noutputs):
-                vals_ii = np.full((nsamples_per_output[ii], nsamples), 0.)
-                vals_jj = np.full((nsamples_per_output[jj], nsamples), 0.)
+                vals_ii = kernel._la_full(
+                    (nsamples_per_output[ii], nsamples), 0.)
+                vals_jj = kernel._la_full(
+                    (nsamples_per_output[jj], nsamples), 0.)
                 for kk in range(kernel.nkernels):
                     wmat_iikk = kernel._get_kernel_combination_matrix_entry(
                         samples_per_output[ii], ii, kk)
                     if wmat_iikk is not None:
-                        vals_ii += wmat_iikk.numpy()*DD_lists[ii][kk]
+                        vals_ii += wmat_iikk * DD_lists[ii][kk]
                 for kk in range(kernel.nkernels):
                     wmat_jjkk = kernel._get_kernel_combination_matrix_entry(
                         samples_per_output[jj], jj, kk)
                     if wmat_jjkk is not None:
-                        vals_jj += wmat_jjkk.numpy()*DD_lists[jj][kk]
+                        vals_jj += wmat_jjkk * DD_lists[jj][kk]
                 kmat_iijj = kernel._evaluate_block(
                     samples_per_output[ii], ii, samples_per_output[jj], jj,
                     False, True)
@@ -118,7 +132,8 @@ def _check_spatially_scaled_multioutput_kernel_covariance(
                 else:
                     assert np.allclose(kmat_iijj, kmat_iijj_mc,  atol=2e-3)
 
-    def _check_multioutput_kernel_3_outputs(self, nvars, degree, MOKernel):
+    def _check_multioutput_kernel_3_outputs(
+            self, nvars, degree, MOKernel, MaternKernel, Monomial):
         nsamples_per_output = [4, 3, 2]
         kernels = [MaternKernel(np.inf, 1.0, [1e-1, 1], nvars),
                    MaternKernel(np.inf, 2.0, [1e-2, 10], nvars),
@@ -127,8 +142,8 @@ def _check_multioutput_kernel_3_outputs(self, nvars, degree, MOKernel):
             Monomial(nvars, degree, 2, [-1, 2], name='scaling1'),
             Monomial(nvars, degree, -3, [-3, 3], name='scaling2')]
         kernel = MOKernel(kernels, scalings)
-        base_training_samples = np.random.uniform(
-            -1, 1, (nvars, nsamples_per_output[0]))
+        base_training_samples = kernel._la_atleast2d(
+            np.random.uniform(-1, 1, (nvars, nsamples_per_output[0])))
         # samples must be nested for tests to work
         samples_per_output = [
             base_training_samples[:, :nsamples]
@@ -138,20 +153,26 @@ def _check_multioutput_kernel_3_outputs(self, nvars, degree, MOKernel):
 
     def test_multioutput_kernels_3_outputs(self):
         test_cases = [
-            [1, 0, MultiPeerKernel],
-            [1, 1, MultiPeerKernel],
-            [2, 1, MultiPeerKernel],
-            [1, 0, MultiLevelKernel],
+            [1, 0, MultiPeerKernel, NumpyMaternKernel, NumpyMonomial],
+            [1, 1, MultiPeerKernel, NumpyMaternKernel, NumpyMonomial],
+            [2, 1, MultiPeerKernel, NumpyMaternKernel, NumpyMonomial],
+            [1, 0, MultiLevelKernel, NumpyMaternKernel, NumpyMonomial],
+            [1, 0, MultiPeerKernel, TorchMaternKernel, TorchMonomial],
+            [1, 1, MultiPeerKernel, TorchMaternKernel, TorchMonomial],
+            [2, 1, MultiPeerKernel, TorchMaternKernel, TorchMonomial],
+            [1, 0, MultiLevelKernel, TorchMaternKernel, TorchMonomial],
         ]
         for test_case in test_cases:
             np.random.seed(1)
             self._check_multioutput_kernel_3_outputs(*test_case)
 
-    def _check_coregionalization_kernel(self, noutputs):
+    def _check_coregionalization_kernel(
+            self, noutputs, MaternKernel, SphericalCovariance):
         nvars = 1
         nsamples_per_output_0 = np.arange(2, 2+noutputs)[::-1]
         latent_kernel = MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
-        radii, radii_bounds = np.arange(1, noutputs+1), [0.1, 10]
+        radii = latent_kernel._la_arange(1, noutputs+1)
+        radii_bounds = [0.1, 10]
         angles = np.pi/4
         output_kernel = SphericalCovariance(
             noutputs, radii, radii_bounds, angles=angles)
@@ -160,45 +181,47 @@ def _check_coregionalization_kernel(self, noutputs):
             -1, 1, (nvars, nsamples_per_output_0[0]))
         # samples must be nested for tests to work
         samples_per_output = [
-            base_training_samples[:, :nsamples]
+            latent_kernel._la_atleast2d(base_training_samples[:, :nsamples])
             for nsamples in nsamples_per_output_0]
         kmat_diag = kernel.diag(samples_per_output)
         kmat = kernel(samples_per_output)
-        assert np.allclose(np.diag(kmat), kmat_diag)
+        assert np.allclose(latent_kernel._la_get_diagonal(kmat), kmat_diag)
 
         cnt = 0
         for nsamples, r in zip(nsamples_per_output_0, radii):
             assert np.allclose(kmat_diag[cnt:cnt+nsamples], r**2)
             cnt += nsamples
         cmat = kernel.output_kernels[0].get_covariance_matrix()
-        from pyapprox.util.utilities import get_correlation_from_covariance
         assert np.allclose(
             kernel.get_output_kernel_correlations_from_psi(0),
-            get_correlation_from_covariance(cmat.numpy())[0, 1:])
+            kernel._la_get_correlation_from_covariance(cmat)[0, 1:])
 
         # Test that when all samples are the same the kernel matrix is
         # equivalent to kronker-product of cov_matrix with kernels[0] matrix
         nsamples_per_output_0 = np.full((noutputs, ), 2)
-        base_training_samples = np.random.uniform(
-            -1, 1, (nvars, nsamples_per_output_0[0]))
+        base_training_samples = kernel._la_atleast2d(
+            np.random.uniform(-1, 1, (nvars, nsamples_per_output_0[0])))
         samples_per_output = [
-            base_training_samples.copy()
+            kernel._la_copy(base_training_samples)
             for nsamples in nsamples_per_output_0]
         kernel = ICMKernel(latent_kernel, output_kernel, noutputs)
         kmat = kernel(samples_per_output)
         cmat = kernel.output_kernels[0].get_covariance_matrix()
         assert np.allclose(
-            kmat.numpy(), np.kron(cmat, latent_kernel(base_training_samples)),
+            kmat,
+            kernel._la_kron(cmat, latent_kernel(base_training_samples)),
             atol=1e-12)
 
     def test_coregionalization_kernel(self):
-        test_cases = [
-            [2], [3], [4], [5]
-        ]
+        test_cases = [[kk, NumpyMaternKernel, NumpySphericalCovariance]
+                      for kk in range(2, 6)]
+        test_cases += [[kk, TorchMaternKernel, TorchSphericalCovariance]
+                       for kk in range(2, 6)]
         for test_case in test_cases:
             self._check_coregionalization_kernel(*test_case)
 
-    def _check_collaborative_kernel(self, noutputs, nlatent_kernels):
+    def _check_collaborative_kernel(self, noutputs, nlatent_kernels,
+                                    MaternKernel, SphericalCovariance):
         nvars = 1
         nsamples_per_output_0 = np.arange(2, 2+noutputs)[::-1]
         latent_kernels = [
@@ -226,7 +249,14 @@ def _check_collaborative_kernel(self, noutputs, nlatent_kernels):
 
     def test_collaborative_kernel(self):
         test_cases = [
-            [2, 1], [3, 2], [4, 2], [5, 1]
+            [2, 1, NumpyMaternKernel, NumpySphericalCovariance],
+            [3, 2, NumpyMaternKernel, NumpySphericalCovariance],
+            [4, 2, NumpyMaternKernel, NumpySphericalCovariance],
+            [5, 1, NumpyMaternKernel, NumpySphericalCovariance],
+            [2, 1, TorchMaternKernel, TorchSphericalCovariance],
+            [3, 2, TorchMaternKernel, TorchSphericalCovariance],
+            [4, 2, TorchMaternKernel, TorchSphericalCovariance],
+            [5, 1, TorchMaternKernel, TorchSphericalCovariance]
         ]
         for test_case in test_cases:
             self._check_collaborative_kernel(*test_case)
@@ -236,10 +266,10 @@ def test_collaborative_kernel(self):
         # are only functions of a unique latent kernel
         noutputs, nvars = 3, 1
         peer_kernels = [
-            MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
+            NumpyMaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
             for kk in range(noutputs)]
         scalings = [
-            Monomial(nvars, 0, 1, [-1, 2], name=f'scaling{ii}')
+            NumpyMonomial(nvars, 0, 1, [-1, 2], name=f'scaling{ii}')
             for ii in range(noutputs-1)]
         peer_kernel = MultiPeerKernel(peer_kernels, scalings)
         nsamples_per_output_0 = np.arange(2, 2+noutputs)[::-1]
@@ -251,7 +281,7 @@ def test_collaborative_kernel(self):
             for nsamples in nsamples_per_output_0]
         peer_kmat = peer_kernel(samples_per_output)
 
-        class HackKernel(SphericalCovariance):
+        class HackKernel(NumpySphericalCovariance):
             def __init__(self, noutputs, cov_mat):
                 super().__init__(noutputs)
                 self.cov_mat = cov_mat
@@ -272,15 +302,16 @@ def __call__(self, ii, jj):
         output_kernels = [
             HackKernel(noutputs, cov_mat) for cov_mat in cov_mats]
         discrepancy_kernels = [
-            ConstantKernel(0)*MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
+            NumpyConstantKernel(0)*NumpyMaternKernel(
+                np.inf, 1.0, [1e-1, 1], nvars)
             for ii in range(noutputs-1)] + [
-                    MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)]
+                    NumpyMaternKernel(np.inf, 1.0, [1e-1, 1], nvars)]
         co_kernel = CollaborativeKernel(
             latent_kernels, output_kernels, discrepancy_kernels, noutputs)
         co_kmat = co_kernel(samples_per_output)
         assert np.allclose(peer_kmat, co_kmat)
 
-    def test_block_cholesky(self):
+    def _check_block_cholesky(self, MaternKernel, Monomial):
         noutputs, nvars, degree = 4, 1, 0
         nsamples_per_output = np.arange(2, 2+noutputs)[::-1]
         kernels = [MaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
@@ -289,8 +320,8 @@ def test_block_cholesky(self):
             Monomial(nvars, degree, 2, [-1, 2], name=f'scaling{ii}')
             for ii in range(noutputs-1)]
         kernel = MultiPeerKernel(kernels, scalings)
-        base_training_samples = np.random.uniform(
-            -1, 1, (nvars, nsamples_per_output[0]))
+        base_training_samples = kernel._la_atleast2d(np.random.uniform(
+            -1, 1, (nvars, nsamples_per_output[0])))
         # samples must be nested for tests to work
         samples_per_output = [
             base_training_samples[:, :nsamples]
@@ -310,15 +341,21 @@ def test_block_cholesky(self):
             kernel._logdet(*L_blocks), np.linalg.slogdet(kmat)[1])
         values = np.random.normal(0, 1, (L.shape[1], 1))
         assert np.allclose(
-            kernel._lower_solve_triangular(*L_blocks, asarray(values)),
+            kernel._lower_solve_triangular(*L_blocks, values),
             scipy.linalg.solve_triangular(L, values, lower=True))
         assert np.allclose(
-            kernel._upper_solve_triangular(*L_blocks, asarray(values)),
+            kernel._upper_solve_triangular(*L_blocks, values),
             scipy.linalg.solve_triangular(L.T, values, lower=False))
         assert np.allclose(
-            kernel._cholesky_solve(*L_blocks, asarray(values)),
+            kernel._cholesky_solve(*L_blocks, values),
             np.linalg.inv(kmat) @ values)
 
+    def test_block_cholesky(self):
+        test_cases = [
+            [NumpyMaternKernel, NumpyMonomial]]
+        for case in test_cases:
+            self._check_block_cholesky(*case)
+
 
 if __name__ == "__main__":
     multioutput_kernels_test_suite = (
diff --git a/pyapprox/surrogates/autogp/torchgp.py b/pyapprox/surrogates/autogp/torchgp.py
new file mode 100644
index 00000000..2224646f
--- /dev/null
+++ b/pyapprox/surrogates/autogp/torchgp.py
@@ -0,0 +1,136 @@
+import torch
+
+from pyapprox.surrogates.kernels._kernels import Kernel
+from pyapprox.surrogates.autogp.trends import Monomial
+from pyapprox.util.transforms._transforms import Transform
+from pyapprox.surrogates.autogp.exactgp import (
+    ExactGaussianProcess, MOExactGaussianProcess, MOPeerExactGaussianProcess,
+    MOICMPeerExactGaussianProcess)
+from pyapprox.util.linearalgebra.torchlinalg import TorchLinAlgMixin
+from pyapprox.util.transforms.torchtransforms import (
+    TorchIdentityTransform, TorchStandardDeviationTransform)
+from pyapprox.surrogates.autogp.variationalgp import (
+    InducingSamples, InducingGaussianProcess)
+from pyapprox.util.hyperparameter.torchhyperparameter import (
+    TorchHyperParameter, TorchHyperParameterList,
+    TorchIdentityHyperParameterTransform, TorchLogHyperParameterTransform)
+
+
+class TorchGPFitMixin:
+    def _fit_objective(self, active_opt_params_np):
+        # todo change to follow call and jacobian api used by new optimize
+        # classes
+
+        # this is only pplace where torch should be called explicitly
+        # as we are using its functionality to compute the gradient of their
+        # negative log likelihood. We could replace this with a grad
+        # computed analytically
+        active_opt_params = torch.tensor(
+            active_opt_params_np, dtype=torch.double, requires_grad=True)
+        nll = self._neg_log_likelihood(active_opt_params)
+        nll.backward()
+        val = nll.item()
+        # copy is needed because zero_ is called
+        nll_grad = active_opt_params.grad.detach().numpy().copy()
+        active_opt_params.grad.zero_()
+        # must set requires grad to False after gradient is computed
+        # otherwise when evaluate_posterior will fail because it will
+        # still think the hyper_params require grad. Extra copies could be
+        # avoided by doing this after fit is complete. However then fit
+        # needs to know when torch is being used
+        for hyp in self.hyp_list.hyper_params:
+            hyp.detach()
+        return val, nll_grad
+
+
+class TorchExactGaussianProcess(
+        TorchLinAlgMixin, TorchGPFitMixin, ExactGaussianProcess):
+    # Mixins must be first if defining an abstractmethod
+    # And init of all nonmixin classes must be called explicitly in this
+    # classes __init__
+    def __init__(self,
+                 nvars: int,
+                 kernel: Kernel,
+                 var_trans: Transform = TorchIdentityTransform(),
+                 values_trans: Transform = TorchStandardDeviationTransform(
+                     trans=True),
+                 mean: Monomial = None,
+                 kernel_reg: float = 0):
+        super().__init__(nvars, kernel, var_trans, values_trans,
+                         mean, kernel_reg)
+
+
+class TorchMOExactGaussianProcess(
+        TorchLinAlgMixin, TorchGPFitMixin, MOExactGaussianProcess):
+    # Mixins must be first if defining an abstractmethod
+    # And init of all nonmixin classes must be called explicitly in this
+    # classes __init__
+    def __init__(self,
+                 nvars: int,
+                 kernel: Kernel = None,
+                 var_trans: Transform = TorchIdentityTransform(),
+                 values_trans: Transform = TorchStandardDeviationTransform(
+                     trans=True),
+                 kernel_reg: float = 0):
+        super().__init__(nvars, kernel, var_trans, values_trans,
+                         None, kernel_reg)
+
+
+class TorchMOPeerExactGaussianProcess(
+        TorchLinAlgMixin, TorchGPFitMixin, MOPeerExactGaussianProcess):
+    # Mixins must be first if defining an abstractmethod
+    # And init of all nonmixin classes must be called explicitly in this
+    # classes __init__
+    def __init__(self,
+                 nvars: int,
+                 kernel: Kernel,
+                 var_trans: Transform = TorchIdentityTransform(),
+                 values_trans: Transform = TorchStandardDeviationTransform(
+                     trans=True),
+                 kernel_reg: float = 0):
+        super().__init__(nvars, kernel, var_trans, values_trans,
+                         None, kernel_reg)
+
+
+class TorchMOICMPeerExactGaussianProcess(
+        TorchLinAlgMixin, TorchGPFitMixin, MOICMPeerExactGaussianProcess):
+    # Mixins must be first if defining an abstractmethod
+    # And init of all nonmixin classes must be called explicitly in this
+    # classes __init__
+    def __init__(self,
+                 nvars: int,
+                 kernel: Kernel,
+                 output_kernel: Kernel,
+                 var_trans: Transform = TorchIdentityTransform(),
+                 values_trans: Transform = TorchStandardDeviationTransform(
+                     trans=True),
+                 kernel_reg: float = 0):
+        super().__init__(nvars, kernel, output_kernel, var_trans, values_trans,
+                         kernel_reg)
+
+
+class TorchInducingSamples(InducingSamples, TorchLinAlgMixin):
+    def __init__(self, nvars, ninducing_samples, inducing_variable=None,
+                 inducing_samples=None, inducing_sample_bounds=None,
+                 noise=None):
+        self._HyperParameter = TorchHyperParameter
+        self._HyperParameterList = TorchHyperParameterList
+        self._IdentityHyperParameterTransform = (
+            TorchIdentityHyperParameterTransform)
+        self._LogHyperParameterTransform = (
+            TorchLogHyperParameterTransform)
+        super().__init__(nvars, ninducing_samples, inducing_variable,
+                         inducing_samples, inducing_sample_bounds,
+                         noise)
+
+
+class TorchInducingGaussianProcess(
+        TorchLinAlgMixin, TorchGPFitMixin, InducingGaussianProcess):
+    def __init__(self, nvars,
+                 kernel,
+                 inducing_samples,
+                 kernel_reg=0,
+                 var_trans=TorchIdentityTransform(),
+                 values_trans=TorchStandardDeviationTransform(trans=True)):
+        super().__init__(nvars, kernel, inducing_samples,
+                         var_trans, values_trans, kernel_reg)
diff --git a/pyapprox/surrogates/autogp/torchtrends.py b/pyapprox/surrogates/autogp/torchtrends.py
new file mode 100644
index 00000000..2aaf01af
--- /dev/null
+++ b/pyapprox/surrogates/autogp/torchtrends.py
@@ -0,0 +1,14 @@
+from pyapprox.util.linearalgebra.torchlinalg import TorchLinAlgMixin
+from pyapprox.util.hyperparameter.torchhyperparameter import (
+    TorchHyperParameter, TorchHyperParameterList,
+    TorchIdentityHyperParameterTransform)
+from pyapprox.surrogates.autogp.trends import Monomial
+
+
+class TorchMonomial(Monomial, TorchLinAlgMixin):
+    def __init__(self, nvars, degree, coefs, coef_bounds,
+                 name="MonomialCoefficients"):
+        self._HyperParameter = TorchHyperParameter
+        self._HyperParameterList = TorchHyperParameterList
+        transform = TorchIdentityHyperParameterTransform()
+        super().__init__(nvars, degree, coefs, coef_bounds, transform, name)
diff --git a/pyapprox/surrogates/autogp/trends.py b/pyapprox/surrogates/autogp/trends.py
new file mode 100644
index 00000000..b8d036ce
--- /dev/null
+++ b/pyapprox/surrogates/autogp/trends.py
@@ -0,0 +1,56 @@
+from pyapprox.surrogates.interp.indexing import compute_hyperbolic_indices
+
+
+class Monomial():
+    def __init__(self, nvars, degree, coefs, coef_bounds,
+                 transform, name="MonomialCoefficients"):
+        self._nvars = nvars
+        self.degree = degree
+        self.indices = compute_hyperbolic_indices(self.nvars(), self.degree)
+        self.nterms = self.indices.shape[1]
+        self._coef = self._HyperParameter(
+            name, self.nterms, coefs, coef_bounds, transform)
+        self.hyp_list = self._HyperParameterList([self._coef])
+
+    def nvars(self):
+        return self._nvars
+
+    def _univariate_monomial_basis_matrix(self, max_level, samples):
+        assert samples.ndim == 1
+        basis_matrix = samples[:, None]**self._la_arange(max_level+1)[None, :]
+        return basis_matrix
+
+    def _monomial_basis_matrix(self, indices, samples):
+        num_vars, num_indices = indices.shape
+        assert samples.shape[0] == num_vars
+        num_samples = samples.shape[1]
+
+        deriv_order = 0
+        basis_matrix = self._la_empty(
+            ((1+deriv_order*num_vars)*num_samples, num_indices))
+        basis_vals_1d = [self._univariate_monomial_basis_matrix(
+            indices[0, :].max(), samples[0, :])]
+        basis_matrix[:num_samples, :] = basis_vals_1d[0][:, indices[0, :]]
+        for dd in range(1, num_vars):
+            basis_vals_1d.append(self._univariate_monomial_basis_matrix(
+                indices[dd, :].max(), samples[dd, :]))
+            basis_matrix[:num_samples, :] *= (
+                basis_vals_1d[dd][:, indices[dd, :]])
+        return basis_matrix
+
+    def basis_matrix(self, samples):
+        return self._monomial_basis_matrix(self.indices, samples)
+
+    def __call__(self, samples):
+        if self.degree == 0:
+            vals = self._la_empty((samples.shape[1], 1))
+            vals[:] = self._coef.get_values()
+            return vals
+        basis_mat = self.basis_matrix(samples)
+        vals = basis_mat @ self._coef.get_values()
+        return vals[:, None]
+
+    def __repr__(self):
+        return "{0}(name={1}, nvars={2}, degree={3}, nterms={4})".format(
+            self.__class__.__name__, self._coef.name, self.nvars(),
+            self.degree, self.nterms)
diff --git a/pyapprox/surrogates/autogp/variationalgp.py b/pyapprox/surrogates/autogp/variationalgp.py
index 9e3949cb..c8acca1a 100644
--- a/pyapprox/surrogates/autogp/variationalgp.py
+++ b/pyapprox/surrogates/autogp/variationalgp.py
@@ -1,31 +1,25 @@
-from torch.distributions import MultivariateNormal
 from typing import Tuple
+
 from scipy import stats
 import numpy as np
+#TODO remove torch and switch to LinAlgMixin
 
 from pyapprox.expdesign.low_discrepancy_sequences import halton_sequence
 from pyapprox.variables.transforms import IndependentMarginalsVariable
-
-from pyapprox.surrogates.autogp._torch_wrappers import (
-    inv, eye, multidot, trace, sqrt, cholesky, solve_triangular, asarray,
-    log, repeat)
-from pyapprox.surrogates.autogp.hyperparameter import (
-    HyperParameter, HyperParameterList, IdentityHyperParameterTransform,
-    LogHyperParameterTransform)
 from pyapprox.surrogates.autogp.exactgp import ExactGaussianProcess
-from pyapprox.surrogates.autogp._torch_wrappers import (
-    diag, full)
-from pyapprox.surrogates.autogp.kernels import Kernel, SumKernel
+from pyapprox.surrogates.kernels._kernels import Kernel, SumKernel
 
 
 def _log_prob_gaussian_with_noisy_nystrom_covariance(
-        noise_std, L_UU, K_XU, values):
+        noise_std, L_UU, K_XU, values, la):
     N, M = K_XU.shape
-    Delta = solve_triangular(L_UU, K_XU.T)/noise_std
-    Omega = eye(M) + Delta@Delta.T
-    L_Omega = cholesky(Omega)
-    log_det = 2*log(L_Omega.diag()).sum()+2*N*log(noise_std)
-    gamma = solve_triangular(L_Omega, Delta @ values)
+    Delta = la._la_solve_triangular(L_UU, K_XU.T)/noise_std
+    Omega = la._la_eye(M) + Delta@Delta.T
+    L_Omega = la._la_cholesky(Omega)
+    log_det = (2*la._la_log(la._la_get_diagonal(L_Omega)).sum() +
+               2*N*la._la_log(la._la_atleast1d(
+                   noise_std)))
+    gamma = la._la_solve_triangular(L_Omega, Delta @ values)
     log_pdf = -0.5*(N*np.log(2*np.pi)+log_det+(values.T@values -
                     gamma.T@gamma)/noise_std**2)
     return log_pdf
@@ -33,7 +27,7 @@ def _log_prob_gaussian_with_noisy_nystrom_covariance(
 # see Alvarez Efficient Multioutput Gaussian Processes through Variational Inducing Kernels for details how to generaize from noise covariance sigma^2I to \Sigma
 
 
-class InducingSamples():
+class InducingSamples:
     def __init__(self, nvars, ninducing_samples, inducing_variable=None,
                  inducing_samples=None, inducing_sample_bounds=None,
                  noise=None):
@@ -44,16 +38,17 @@ def __init__(self, nvars, ninducing_samples, inducing_variable=None,
         (self.inducing_variable, self.init_inducing_samples,
          inducing_sample_bounds) = self._init_inducing_samples(
              inducing_variable, inducing_samples, inducing_sample_bounds)
-        self._inducing_samples = HyperParameter(
+        self._inducing_samples = self._HyperParameter(
             "inducing_samples", self.nvars*self.ninducing_samples,
             self.init_inducing_samples.flatten(),
             inducing_sample_bounds.flatten(),
-            IdentityHyperParameterTransform())
+            self._IdentityHyperParameterTransform())
         if noise is None:
-            noise = HyperParameter(
-                'noise', 1, 1e-2, (1e-15, 1e3), LogHyperParameterTransform())
+            noise = self._HyperParameter(
+                'noise', 1, 1e-2, (1e-15, 1e3),
+                self._LogHyperParameterTransform())
         self._noise = noise
-        self.hyp_list = HyperParameterList(
+        self.hyp_list = self._HyperParameterList(
             [self._noise, self._inducing_samples])
 
     def _init_inducing_samples(self, inducing_variable, inducing_samples,
@@ -74,11 +69,11 @@ def _init_inducing_samples(self, inducing_variable, inducing_samples,
             inducing_sample_bounds = inducing_variable.get_statistics(
                 "interval", 1.)
         else:
-            inducing_sample_bounds = asarray(inducing_sample_bounds)
+            inducing_sample_bounds = inducing_sample_bounds
             if inducing_sample_bounds.ndim == 1:
                 if inducing_sample_bounds.shape[0] != 2:
                     raise ValueError(msg)
-                inducing_sample_bounds = repeat(
+                inducing_sample_bounds = self._la_repeat(
                     inducing_sample_bounds, self.ninducing_samples).reshape(
                         self.ninducing_samples, 2)
         if (inducing_sample_bounds.shape !=
@@ -108,14 +103,15 @@ class InducingGaussianProcess(ExactGaussianProcess):
     larger than the “actual” noise in a way that is proportional to the
     inaccuracy of the approximation
     """
-    def __init__(self, nvars: int,
-                 kernel: Kernel,
-                 inducing_samples: InducingSamples,
-                 kernel_reg: float = 0,
-                 var_trans=None,
-                 values_trans=None):
-        super().__init__(nvars, kernel, kernel_reg, var_trans,
-                         values_trans)
+    def __init__(self,
+                 nvars,
+                 kernel,
+                 inducing_samples,
+                 var_trans,
+                 values_trans,
+                 kernel_reg):
+        super().__init__(nvars, kernel, var_trans, values_trans, None,
+                         kernel_reg)
 
         if isinstance(kernel, SumKernel):
             # TODO check that sumkernel is return when using
@@ -137,7 +133,7 @@ def _K_XU(self) -> Tuple:
     def _K_UU(self) -> Tuple:
         inducing_samples = self.inducing_samples.get_samples()
         kmat = self.kernel(inducing_samples, inducing_samples)
-        kmat = kmat + eye(kmat.shape[0])*float(self.kernel_reg)
+        kmat = kmat + self._la_eye(kmat.shape[0])*float(self.kernel_reg)
         return kmat
 
     def _training_kernel_matrix(self):
@@ -172,14 +168,15 @@ def _neg_log_likelihood(self, active_opt_params):
         K_UU = self._K_UU()
         # if the following line throws a ValueError it is likely
         # because self.noise is to small. If so adjust noise bounds
-        L_UU = cholesky(K_UU)
+        L_UU = self._la_cholesky(K_UU)
         mll = _log_prob_gaussian_with_noisy_nystrom_covariance(
-            noise_std, L_UU, K_XU, self.canonical_train_values)
+            noise_std, L_UU, K_XU, self.canonical_train_values, self)
         # add a regularization term to regularize variance noting that
         # trace of matrix sum is sum of traces
         K_XX_diag = self.kernel.diag(self.canonical_train_samples)
-        tmp = solve_triangular(L_UU, K_XU.T)
-        K_tilde_trace = K_XX_diag.sum() - trace(multidot((tmp.T, tmp)))
+        tmp = self._la_solve_triangular(L_UU, K_XU.T)
+        K_tilde_trace = K_XX_diag.sum() - self._la_trace(
+            self._la_multidot((tmp.T, tmp)))
         mll -= 1/(2*noise_std**2) * K_tilde_trace
         return -mll
 
@@ -188,18 +185,19 @@ def _evaluate_posterior(self, Z, return_std):
         K_XU = self._K_XU()
         K_UU = self._K_UU()
 
-        K_UU_inv = inv(K_UU)
+        K_UU_inv = self._la_inv(K_UU)
         # Titsias 2009 Equation (6) B = Kuu_inv*A(Kuu_inv)
         # A is s Equation (11) in Vanderwilk 2020
         # which depends on \Sigma defined below Equation (10) Titsias
         # which we call Lambda below
-        Lambda = K_UU_inv + multidot((
+        Lambda = K_UU_inv + self._la_multidot((
             K_UU_inv, K_XU.T, K_XU, K_UU_inv/noise_std**2))
-        Lambda_inv = inv(Lambda)
-        m = multidot((Lambda_inv, K_UU_inv, K_XU.T,
-                      self.canonical_train_values.squeeze()/noise_std**2))
+        Lambda_inv = self._la_inv(Lambda)
+        m = self._la_multidot((
+            Lambda_inv, K_UU_inv, K_XU.T,
+            self.canonical_train_values.squeeze()/noise_std**2))
 
-        #TODO replace lamnda inv with use of cholesky factors
+        # TODO replace lamnda inv with use of cholesky factors
 
         K_ZU = self.kernel(
             Z, self.inducing_samples.get_samples())
@@ -207,14 +205,16 @@ def _evaluate_posterior(self, Z, return_std):
 
         # Equation (6) in Titsias 2009 or
         # Equation (11) in Vanderwilk 2020
-        mu = multidot((K_ZU, K_UU_inv, m))
+        mu = self._la_multidot((K_ZU, K_UU_inv, m))
 
         if not return_std:
             return mu
 
         # The following is from Equation (6) in Titsias 2009 and
         # Equation (11) in Vanderwilk 2020 where Lambda^{-1} = S
-        sigma = (K_ZZ - multidot((K_ZU, K_UU_inv, K_ZU.T)) +
-                 multidot((K_ZU, K_UU_inv, Lambda_inv, K_UU_inv, K_ZU.T)))
-        return mu[:, None],  sqrt(diag(sigma))[:, None]
+        sigma = (K_ZZ - self._la_multidot((K_ZU, K_UU_inv, K_ZU.T)) +
+                 self._la_multidot(
+                     (K_ZU, K_UU_inv, Lambda_inv, K_UU_inv, K_ZU.T)))
+        return mu[:, None],  self._la_sqrt(
+            self._la_get_diagonal(sigma))[:, None]
         # return mu[:, None],  (diag(sigma))[:, None]
diff --git a/pyapprox/surrogates/kernels/__init__.py b/pyapprox/surrogates/kernels/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/pyapprox/surrogates/kernels/_kernels.py b/pyapprox/surrogates/kernels/_kernels.py
new file mode 100644
index 00000000..dd46cc54
--- /dev/null
+++ b/pyapprox/surrogates/kernels/_kernels.py
@@ -0,0 +1,289 @@
+from abc import ABC, abstractmethod
+import math
+from pyapprox.util.hyperparameter._hyperparameter import CombinedHyperParameter
+
+
+class Kernel(ABC):
+    def diag(self, X1):
+        """Return the diagonal of the kernel matrix."""
+        return self._la_get_diagonal(self(X1))
+
+    @abstractmethod
+    def __call__(self, X1, X2=None):
+        raise NotImplementedError()
+
+    def __mul__(self, kernel):
+        return ProductKernel(self, kernel)
+
+    def __add__(self, kernel):
+        return SumKernel(self, kernel)
+
+    def __repr__(self):
+        return "{0}({1}, la={2})".format(
+            self.__class__.__name__, self.hyp_list._short_repr(), self._la)
+
+
+class CompositionKernel(Kernel):
+    def __init__(self, kernel1, kernel2):
+        self.kernel1 = kernel1
+        self.kernel2 = kernel2
+        self.hyp_list = kernel1.hyp_list+kernel2.hyp_list
+
+        # make linear algebra functions accessible via product_kernel._la_
+        for attr in dir(kernel1):
+            if len(attr) >= 4 and attr[:4] == "_la_":
+                setattr(self, attr, getattr(self.kernel1, attr))
+
+    def nvars(self):
+        if hasattr(self.kernel1, "nvars"):
+            return self.kernel1.nvars()
+        return self.kernel2.nvars()
+
+
+class ProductKernel(CompositionKernel):
+    def diag(self, X1):
+        return self.kernel1.diag(X1) * self.kernel2.diag(X1)
+
+    def __repr__(self):
+        return "{0} * {1}".format(self.kernel1, self.kernel2)
+
+    def __call__(self, X1, X2=None):
+        return self.kernel1(X1, X2) * self.kernel2(X1, X2)
+
+    def jacobian(self, X):
+        Kmat1 = self.kernel1(X)
+        Kmat2 = self.kernel2(X)
+        jac1 = self.kernel1.jacobian(X)
+        jac2 = self.kernel2.jacobian(X)
+        return self._la_dstack(
+            [jac1*Kmat2[..., None], jac2*Kmat1[..., None]])
+
+
+class SumKernel(CompositionKernel):
+    def diag(self, X1):
+        return self.kernel1.diag(X1) + self.kernel2.diag(X1)
+
+    def __repr__(self):
+        return "{0} + {1}".format(self.kernel1, self.kernel2)
+
+    def __call__(self, X1, X2=None):
+        return self.kernel1(X1, X2) + self.kernel2(X1, X2)
+
+    def jacobian(self, X):
+        jac1 = self.kernel1.jacobian(X)
+        jac2 = self.kernel2.jacobian(X)
+        return self._la_dstack([jac1, jac2])
+
+
+class MaternKernel(Kernel):
+    def __init__(self, nu: float,
+                 lenscale, lenscale_bounds, nvars: int,
+                 transform):
+        """The matern kernel for varying levels of smoothness."""
+        self._nvars = nvars
+        self.nu = nu
+        self._lenscale = self._HyperParameter(
+            "lenscale", nvars, lenscale, lenscale_bounds, transform)
+        self.hyp_list = self._HyperParameterList([self._lenscale])
+
+    def diag(self, X1):
+        return self._la_full((X1.shape[1],), 1)
+
+    def _eval_distance_form(self, distances):
+        if self.nu == self._la_inf():
+            return self._la_exp(-(distances**2)/2.)
+        if self.nu == 5/2:
+            tmp = self._la_sqrt(5)*distances
+            return (1.0+tmp+tmp**2/3.)*self._la_exp(-tmp)
+        if self.nu == 3/2:
+            tmp = self._la_sqrt(3)*distances
+            return (1.+tmp)*self._la_exp(-tmp)
+        if self.nu == 1/2:
+            return self._la_exp(-distances)
+        raise ValueError("Matern kernel with nu={0} not supported".format(
+            self.nu))
+
+    def __call__(self, X1, X2=None):
+        lenscale = self._lenscale.get_values()
+        if X2 is None:
+            X2 = X1
+        distances = self._la_cdist(X1.T/lenscale, X2.T/lenscale)
+        return self._eval_distance_form(distances)
+
+    def nvars(self):
+        return self._nvars
+
+
+class ConstantKernel(Kernel):
+    def __init__(self, constant, transform, constant_bounds=None):
+        if constant_bounds is None:
+            constant_bounds = [-self._la_inf(), self._la_inf()]
+        self._const = self._HyperParameter(
+            "const", 1, constant, constant_bounds, transform)
+        self.hyp_list = self._HyperParameterList([self._const])
+
+    def diag(self, X1):
+        return self._la_full((X1.shape[1],), self.hyp_list.get_values()[0])
+
+    def __call__(self, X1, X2=None):
+        if X2 is None:
+            X2 = X1
+        # full does not work when const value requires grad
+        # return full((X1.shape[1], X2.shape[1]), self._const.get_values()[0])
+        const = self._la_empty((X1.shape[1], X2.shape[1]))
+        const[:] = self._const.get_values()[0]
+        return const
+
+
+class GaussianNoiseKernel(Kernel):
+    def __init__(self, constant, transform, constant_bounds=None):
+        self._const = self._HyperParameter(
+            "const", 1, constant, constant_bounds, transform)
+        self.hyp_list = self._HyperParameterList([self._const])
+
+    def diag(self, X):
+        return self._la_full((X.shape[1],), self.hyp_list.get_values()[0])
+
+    def __call__(self, X, Y=None):
+        if Y is None:
+            return self._const.get_values()[0]*self._la_eye(X.shape[1])
+        # full does not work when const value requires grad
+        # return full((X.shape[1], Y.shape[1]), self._const.get_values()[0])
+        const = self._la_full((X.shape[1], Y.shape[1]), 0.)
+        return const
+
+
+class PeriodicMaternKernel(MaternKernel):
+    def __init__(self,
+                 nu: float,
+                 period,
+                 period_bounds,
+                 lenscale,
+                 lenscale_bounds,
+                 lenscale_transform,
+                 period_transform):
+        super().__init__(nu, lenscale, lenscale_bounds, 1, lenscale_transform)
+        self._period = self._HyperParameter(
+            "period", 1, lenscale, lenscale_bounds, period_transform)
+        self.hyp_list += self._HyperParameterList([self._period])
+
+    def __call__(self, X, Y=None):
+        if Y is None:
+            Y = X
+        lenscale = self._lenscale.get_values()
+        period = self._period.get_values()
+        distances = self._la_cdist(X.T/period, Y.T/period)/lenscale
+        return super()._eval_distance_form(distances)
+
+    def diag(self, X):
+        return super().diag(X)
+
+
+class HilbertSchmidtKernel(Kernel):
+    def __init__(self,
+                 basis,
+                 weights,
+                 weight_bounds,
+                 transform,
+                 normalize: bool = False):
+        self._nvars = basis.nvars()
+        self._basis = basis
+        self._nterms = basis.nterms()**2
+        self._normalize = normalize
+        self._weights = self._HyperParameter(
+            "weights", self._nterms, weights, weight_bounds,
+            transform)
+        self.hyp_list = self._HyperParameterList([self._weights])
+
+    def _get_weights(self):
+        return self._la_reshape(
+            self._weights.get_values(),
+            (self._basis.nterms(), self._basis.nterms()))
+
+    def __call__(self, X1, X2=None):
+        weights = self._get_weights()
+        if X2 is None:
+            X2 = X1
+        X1basis_mat = self._basis(X1)
+        X2basis_mat = self._basis(X2)
+        if self._normalize:
+            X1basis_mat /= self._la_norm(X1basis_mat, axis=1)[:, None]
+            X2basis_mat /= self._la_norm(X2basis_mat, axis=1)[:, None]
+        K = (X1basis_mat @ weights) @ X2basis_mat.T
+        return K
+
+
+class SphericalCovarianceHyperParameter(CombinedHyperParameter):
+    def __init__(self, hyper_params: list):
+        super().__init__(hyper_params)
+        self.cov_matrix = None
+        self.name = "spherical_covariance"
+        self.transform = self._IdentityHyperParameterTransform()
+        noutputs = hyper_params[0].nvars()
+        self._trans = self._SphericalCorrelationTransform(noutputs)
+        self._set_covariance_matrix()
+
+    def _set_covariance_matrix(self):
+        L = self._trans.map_to_cholesky(self.get_values())
+        self.cov_matrix = L@L.T
+
+    def set_active_opt_params(self, active_params):
+        super().set_active_opt_params(active_params)
+        self._set_covariance_matrix()
+
+    def __repr__(self):
+        return "{0}(name={1}, nvars={2}, transform={3}, nactive={4})".format(
+            self.__class__.__name__, self.name, self.nvars(), self.transform,
+            self.nactive_vars())
+
+
+class SphericalCovariance:
+    def __init__(self, noutputs, radii_transform, angle_transform,
+                 radii=1, radii_bounds=[1e-1, 1],
+                 angles=math.pi/2, angle_bounds=[0, math.pi]):
+        # Angle bounds close to zero can create zero on the digaonal
+        # E.g. for speherical coordinates sin(0) = 0
+        self.noutputs = noutputs
+        self._trans = self._SphericalCorrelationTransform(self.noutputs)
+        self._validate_bounds(radii_bounds, angle_bounds)
+        self._radii = self._HyperParameter(
+            "radii", self.noutputs, radii, radii_bounds, radii_transform)
+        self._angles = self._HyperParameter(
+            "angles", self._trans.ntheta-self.noutputs, angles, angle_bounds,
+            angle_transform)
+        self.hyp_list = self._HyperParameterList(
+            [self._SphericalCovarianceHyperParameter(
+                [self._radii, self._angles])])
+
+    def _validate_bounds(self, radii_bounds, angle_bounds):
+        bounds = self._trans.get_spherical_bounds()
+        # all theoretical radii_bounds are the same so just check one
+        radii_bounds = self._la_atleast1d(radii_bounds)
+        if radii_bounds.shape[0] == 2:
+            radii_bounds = self._la_repeat(radii_bounds, self.noutputs)
+        radii_bounds = radii_bounds.reshape((radii_bounds.shape[0]//2, 2))
+        if (self._la_any(radii_bounds[:, 0] < bounds[:self.noutputs, 0]) or
+                self._la_any(radii_bounds[:, 1] > bounds[:self.noutputs, 1])):
+            raise ValueError("radii bounds are inconsistent")
+        # all theoretical angle_bounds are the same so just check one
+        angle_bounds = self._la_atleast1d(angle_bounds)
+        if angle_bounds.shape[0] == 2:
+            angle_bounds = self._la_repeat(
+                angle_bounds, self._trans.ntheta-self.noutputs)
+        angle_bounds = angle_bounds.reshape((angle_bounds.shape[0]//2, 2))
+        if (self._la_any(angle_bounds[:, 0] < bounds[self.noutputs:, 0]) or
+                self._la_any(angle_bounds[:, 1] > bounds[self.noutputs:, 1])):
+            raise ValueError("angle bounds are inconsistent")
+
+    def get_covariance_matrix(self):
+        return self.hyp_list.hyper_params[0].cov_matrix
+
+    def __call__(self, ii, jj):
+        # chol factor must be recomputed each time even if hyp_values have not
+        # changed otherwise gradient graph becomes inconsistent
+        return self.hyp_list.hyper_params[0].cov_matrix[ii, jj]
+
+    def __repr__(self):
+        return "{0}(radii={1}, angles={2} cov={3})".format(
+            self.__class__.__name__, self._radii, self._angles,
+            self.get_covariance_matrix().detach().numpy())
diff --git a/pyapprox/surrogates/kernels/numpykernels.py b/pyapprox/surrogates/kernels/numpykernels.py
new file mode 100644
index 00000000..01019ead
--- /dev/null
+++ b/pyapprox/surrogates/kernels/numpykernels.py
@@ -0,0 +1,75 @@
+import math
+
+from pyapprox.util.linearalgebra.numpylinalg import NumpyLinAlgMixin
+from pyapprox.surrogates.kernels._kernels import (
+    ConstantKernel, GaussianNoiseKernel, MaternKernel, PeriodicMaternKernel,
+    SphericalCovariance, SphericalCovarianceHyperParameter)
+from pyapprox.util.hyperparameter.numpyhyperparameter import (
+    NumpyIdentityHyperParameterTransform, NumpyLogHyperParameterTransform,
+    NumpyHyperParameter, NumpyHyperParameterList)
+from pyapprox.util.transforms.numpytransforms import (
+    NumpySphericalCorrelationTransform)
+
+
+class NumpyConstantKernel(ConstantKernel, NumpyLinAlgMixin):
+    def __init__(self, constant, constant_bounds=None,
+                 transform=NumpyIdentityHyperParameterTransform()):
+        self._HyperParameter = NumpyHyperParameter
+        self._HyperParameterList = NumpyHyperParameterList
+        super().__init__(constant, transform, constant_bounds)
+
+
+class NumpyGaussianNoiseKernel(GaussianNoiseKernel, NumpyLinAlgMixin):
+    def __init__(self, constant, constant_bounds=None):
+        self._HyperParameter = NumpyHyperParameter
+        self._HyperParameterList = NumpyHyperParameterList
+        super().__init__(
+            constant, NumpyLogHyperParameterTransform(), constant_bounds)
+
+
+class NumpyMaternKernel(MaternKernel, NumpyLinAlgMixin):
+    def __init__(self, nu: float,
+                 lenscale, lenscale_bounds, nvars: int):
+        self._HyperParameter = NumpyHyperParameter
+        self._HyperParameterList = NumpyHyperParameterList
+        super().__init__(nu, lenscale, lenscale_bounds, nvars,
+                         NumpyLogHyperParameterTransform())
+
+
+class NumpyPeriodicMaternKernel(PeriodicMaternKernel, NumpyLinAlgMixin):
+    def __init__(self, nu: float, period, period_bounds,
+                 lenscale, lenscale_bounds):
+        self._HyperParameter = NumpyHyperParameter
+        self._HyperParameterList = NumpyHyperParameterList
+        super().__init__(
+            nu, period, period_bounds, lenscale, lenscale_bounds,
+            NumpyLogHyperParameterTransform(),
+            NumpyLogHyperParameterTransform())
+
+
+class NumpySphericalCovarianceHyperParameter(
+        SphericalCovarianceHyperParameter, NumpyLinAlgMixin):
+    def __init__(self, hyper_params):
+        self._SphericalCorrelationTransform = (
+            NumpySphericalCorrelationTransform)
+        self._IdentityHyperParameterTransform = (
+            NumpyIdentityHyperParameterTransform)
+        super().__init__(hyper_params)
+
+
+class NumpySphericalCovariance(SphericalCovariance, NumpyLinAlgMixin):
+    def __init__(self, noutputs,
+                 radii=1, radii_bounds=[1e-1, 1],
+                 angles=math.pi/2, angle_bounds=[0, math.pi],
+                 radii_transform=NumpyIdentityHyperParameterTransform(),
+                 angle_transform=NumpyIdentityHyperParameterTransform()):
+        self._SphericalCorrelationTransform = (
+            NumpySphericalCorrelationTransform)
+        self._HyperParameter = NumpyHyperParameter
+        self._HyperParameterList = NumpyHyperParameterList
+        self._SphericalCovarianceHyperParameter = (
+            NumpySphericalCovarianceHyperParameter)
+        self._IdentityHyperParameterTransform = (
+            NumpyIdentityHyperParameterTransform)
+        super().__init__(noutputs, radii_transform, angle_transform,
+                         radii, radii_bounds, angles, angle_bounds)
diff --git a/pyapprox/surrogates/kernels/tests/__init__.py b/pyapprox/surrogates/kernels/tests/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/pyapprox/surrogates/kernels/tests/test_kernels.py b/pyapprox/surrogates/kernels/tests/test_kernels.py
new file mode 100644
index 00000000..9ba6579b
--- /dev/null
+++ b/pyapprox/surrogates/kernels/tests/test_kernels.py
@@ -0,0 +1,120 @@
+import unittest
+import numpy as np
+
+from pyapprox.surrogates.kernels.numpykernels import (
+    NumpyConstantKernel, NumpyMaternKernel, NumpyPeriodicMaternKernel,
+    NumpyGaussianNoiseKernel)
+from pyapprox.surrogates.kernels.torchkernels import (
+    TorchMaternKernel, TorchPeriodicMaternKernel,
+    TorchConstantKernel, TorchGaussianNoiseKernel)
+from pyapprox.util.hyperparameter.numpyhyperparameter import (
+    NumpyIdentityHyperParameterTransform, NumpyLogHyperParameterTransform)
+
+
+def approx_jacobian_3D(f, x0, epsilon=np.sqrt(np.finfo(float).eps)):
+    fval = f(x0)
+    jacobian = np.zeros((fval.shape[0], fval.shape[1], x0.shape[0]))
+    for ii in range(len(x0)):
+        dx = np.full((x0.shape[0]), 0.)
+        dx[ii] = epsilon
+        fval_perturbed = f(x0+dx)
+        jacobian[..., ii] = (fval_perturbed - fval) / epsilon
+    return jacobian
+
+
+class TestKernels(unittest.TestCase):
+    def setUp(self):
+        np.random.seed(1)
+
+    def _check_kernels(self, MaternKernel, ConstantKernel,
+                       PeriodicMaternKernel):
+        kernel_inf = MaternKernel(np.inf, 1.0, [1e-1, 1], 2)
+        values = kernel_inf._la_atleast1d([0.5, 0.5])
+        kernel_inf.hyp_list.set_active_opt_params(kernel_inf._la_log(values))
+        assert np.allclose(kernel_inf.hyp_list.get_values(), values)
+
+        nsamples1, nsamples2 = 5, 3
+        X = np.random.normal(0, 1, (2, nsamples1))
+        Y = np.random.normal(0, 1, (2, nsamples2))
+        assert np.allclose(
+            kernel_inf.diag(X), kernel_inf._la_get_diagonal(kernel_inf(X, X)))
+
+        const0 = 2.0
+        kernel_prod = kernel_inf*ConstantKernel(const0)
+        assert np.allclose(kernel_prod.diag(X), const0*kernel_inf.diag(X))
+        assert np.allclose(
+            kernel_prod.diag(X),
+            kernel_inf._la_get_diagonal(kernel_prod(X, X)))
+        assert np.allclose(kernel_prod(X, Y), const0*kernel_inf(X, Y))
+
+        const1 = 3.0
+        kernel_sum = kernel_prod+ConstantKernel(const1)
+        assert np.allclose(
+            kernel_sum.diag(X), const0*kernel_inf.diag(X)+const1)
+        assert np.allclose(
+            kernel_sum.diag(X), kernel_prod._la_get_diagonal(kernel_sum(X, X)))
+        assert np.allclose(kernel_sum(X, Y), const0*kernel_inf(X, Y)+const1)
+
+        kernel_periodic = PeriodicMaternKernel(
+            0.5, 1.0, [1e-1, 1], 1, [1e-1, 1])
+        values = kernel_periodic._la_atleast1d([0.5, 0.5])
+        kernel_periodic.hyp_list.set_active_opt_params(
+            kernel_periodic._la_log(values))
+        assert np.allclose(kernel_periodic.hyp_list.get_values(), values)
+        assert np.allclose(
+            kernel_periodic.diag(X), kernel_periodic._la_get_diagonal(
+                kernel_periodic(X, X)))
+
+    def test_kernels(self):
+        test_cases = [
+            [NumpyMaternKernel, NumpyConstantKernel,
+             NumpyPeriodicMaternKernel],
+            [TorchMaternKernel, TorchConstantKernel,
+             TorchPeriodicMaternKernel]]
+        for case in test_cases:
+            self._check_kernels(*case)
+
+    def check_kernel_jacobian(self, torch_kernel, np_kernel, nsamples):
+        X = np.random.uniform(-1, 1, (torch_kernel.nvars(), nsamples))
+        torch_jacobian = torch_kernel.jacobian(torch_kernel._la_atleast2d(X))
+        for hyp in torch_kernel.hyp_list.hyper_params:
+            hyp._values = hyp._values.clone().detach()
+
+        def fun(active_params_opt):
+            np_kernel.hyp_list.set_active_opt_params(active_params_opt)
+            return np_kernel(X)
+        assert np.allclose(
+            torch_jacobian.numpy(),
+            approx_jacobian_3D(
+                fun, np_kernel.hyp_list.get_active_opt_params()))
+
+    def test_kernel_jacobian(self):
+        nvars, nsamples = 2, 3
+        torch_kernel = TorchMaternKernel(np.inf, 1.0, [1e-1, 1], nvars)
+        np_kernel = NumpyMaternKernel(
+            np.inf, 1.0, [1e-1, 1], nvars)
+        self.check_kernel_jacobian(torch_kernel, np_kernel, nsamples)
+
+        const = 1
+        torch_kernel = (TorchConstantKernel(const) *
+                        TorchMaternKernel(np.inf, 1.0, [1e-1, 1], nvars))
+        np_kernel = (
+            NumpyConstantKernel(const) *
+            NumpyMaternKernel(np.inf, 1.0, [1e-1, 1], nvars))
+        self.check_kernel_jacobian(torch_kernel, np_kernel, nsamples)
+
+        const = 1
+        torch_kernel = (
+            TorchMaternKernel(np.inf, 1.0, [1e-1, 1], nvars) +
+            TorchGaussianNoiseKernel(1, [1e-2, 10]))
+        np_kernel = (
+            NumpyMaternKernel(
+                np.inf, 1.0, [1e-1, 1], nvars) +
+            NumpyGaussianNoiseKernel(1, [1e-2, 10]))
+        self.check_kernel_jacobian(torch_kernel, np_kernel, nsamples)
+
+
+if __name__ == "__main__":
+    kernels_test_suite = unittest.TestLoader().loadTestsFromTestCase(
+        TestKernels)
+    unittest.TextTestRunner(verbosity=2).run(kernels_test_suite)
diff --git a/pyapprox/surrogates/kernels/torchkernels.py b/pyapprox/surrogates/kernels/torchkernels.py
new file mode 100644
index 00000000..96a4869f
--- /dev/null
+++ b/pyapprox/surrogates/kernels/torchkernels.py
@@ -0,0 +1,91 @@
+import math
+
+import torch
+
+from pyapprox.util.linearalgebra.torchlinalg import TorchLinAlgMixin
+from pyapprox.util.hyperparameter.torchhyperparameter import (
+    TorchIdentityHyperParameterTransform, TorchLogHyperParameterTransform,
+    TorchHyperParameter, TorchHyperParameterList)
+from pyapprox.surrogates.kernels._kernels import (
+    MaternKernel, ConstantKernel, GaussianNoiseKernel, PeriodicMaternKernel,
+    SphericalCovariance, SphericalCovarianceHyperParameter)
+from pyapprox.util.transforms.torchtransforms import (
+    TorchSphericalCorrelationTransform)
+
+
+class TorchAutogradMixin:
+    def _autograd_fun(self, active_params_opt):
+        active_params_opt.requires_grad = True
+        self.hyp_list.set_active_opt_params(active_params_opt)
+        return self(self._X)
+
+    def jacobian(self, X):
+        self._X = X
+        return torch.autograd.functional.jacobian(
+            self._autograd_fun, self.hyp_list.get_active_opt_params())
+
+
+class TorchConstantKernel(
+        ConstantKernel, TorchAutogradMixin, TorchLinAlgMixin):
+    def __init__(self, constant, constant_bounds=None,
+                 transform=TorchIdentityHyperParameterTransform()):
+        self._HyperParameter = TorchHyperParameter
+        self._HyperParameterList = TorchHyperParameterList
+        super().__init__(constant, transform, constant_bounds)
+
+
+class TorchGaussianNoiseKernel(
+        GaussianNoiseKernel, TorchAutogradMixin, TorchLinAlgMixin):
+    def __init__(self, constant, constant_bounds=None):
+        self._HyperParameter = TorchHyperParameter
+        self._HyperParameterList = TorchHyperParameterList
+        super().__init__(
+            constant, TorchLogHyperParameterTransform(), constant_bounds)
+
+
+class TorchMaternKernel(MaternKernel, TorchAutogradMixin, TorchLinAlgMixin):
+    def __init__(self, nu: float,
+                 lenscale, lenscale_bounds, nvars: int):
+        self._HyperParameter = TorchHyperParameter
+        self._HyperParameterList = TorchHyperParameterList
+        super().__init__(nu, lenscale, lenscale_bounds, nvars,
+                         TorchLogHyperParameterTransform())
+
+
+class TorchPeriodicMaternKernel(PeriodicMaternKernel, TorchLinAlgMixin):
+    def __init__(self, nu: float, period, period_bounds,
+                 lenscale, lenscale_bounds):
+        self._HyperParameter = TorchHyperParameter
+        self._HyperParameterList = TorchHyperParameterList
+        super().__init__(
+            nu, period, period_bounds, lenscale, lenscale_bounds,
+            TorchLogHyperParameterTransform(),
+            TorchLogHyperParameterTransform())
+
+
+class TorchSphericalCovarianceHyperParameter(
+        SphericalCovarianceHyperParameter, TorchLinAlgMixin):
+    def __init__(self, hyper_params):
+        self._SphericalCorrelationTransform = (
+            TorchSphericalCorrelationTransform)
+        self._IdentityHyperParameterTransform = (
+            TorchIdentityHyperParameterTransform)
+        super().__init__(hyper_params)
+
+
+class TorchSphericalCovariance(SphericalCovariance, TorchLinAlgMixin):
+    def __init__(self, noutputs,
+                 radii=1, radii_bounds=[1e-1, 1],
+                 angles=math.pi/2, angle_bounds=[0, math.pi],
+                 radii_transform=TorchIdentityHyperParameterTransform(),
+                 angle_transform=TorchIdentityHyperParameterTransform()):
+        self._SphericalCorrelationTransform = (
+            TorchSphericalCorrelationTransform)
+        self._HyperParameter = TorchHyperParameter
+        self._HyperParameterList = TorchHyperParameterList
+        self._SphericalCovarianceHyperParameter = (
+            TorchSphericalCovarianceHyperParameter)
+        self._IdentityHyperParameterTransform = (
+            TorchIdentityHyperParameterTransform)
+        super().__init__(noutputs, radii_transform, angle_transform,
+                         radii, radii_bounds, angles, angle_bounds)
diff --git a/pyapprox/util/hyperparameter/__init__.py b/pyapprox/util/hyperparameter/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/pyapprox/util/hyperparameter/_hyperparameter.py b/pyapprox/util/hyperparameter/_hyperparameter.py
new file mode 100644
index 00000000..663a32c4
--- /dev/null
+++ b/pyapprox/util/hyperparameter/_hyperparameter.py
@@ -0,0 +1,241 @@
+from abc import ABC, abstractmethod
+
+
+class HyperParameterTransform(ABC):
+    @abstractmethod
+    def to_opt_space(self, params):
+        raise NotImplementedError
+
+    @abstractmethod
+    def from_opt_space(self, params):
+        raise NotImplementedError
+
+    def __repr__(self):
+        return "{0}".format(self.__class__.__name__)
+
+
+class IdentityHyperParameterTransform(HyperParameterTransform):
+    def to_opt_space(self, params):
+        return params
+
+    def from_opt_space(self, params):
+        return params
+
+
+class LogHyperParameterTransform(HyperParameterTransform):
+    def to_opt_space(self, params):
+        return self._la_log(params)
+
+    def from_opt_space(self, params):
+        return self._la_exp(params)
+
+
+class HyperParameter:
+    def __init__(self, name: str, nvars: int,
+                 values, bounds,
+                 transform: HyperParameterTransform):
+        """A possibly vector-valued hyper-parameter to be used with
+        optimization."""
+        self.name = name
+        self._nvars = nvars
+        self.transform = transform
+        self._values = self._la_atleast1d(values)
+        if self._values.shape[0] == 1:
+            self._values = self._la_repeat(self._values, self.nvars())
+        if self._values.ndim == 2:
+            raise ValueError("values is not a 1D array")
+        if self._values.shape[0] != self.nvars():
+            raise ValueError(
+                "values shape {0} inconsistent with nvars {1}".format(
+                    self._values.shape, self._nvars()))
+        self.bounds = self._la_atleast1d(bounds)
+        if self.bounds.shape[0] == 2:
+            self.bounds = self._la_repeat(self.bounds, self.nvars())
+        if self.bounds.shape[0] != 2*self.nvars():
+            msg = "bounds shape {0} inconsistent with 2*nvars={1}".format(
+                self.bounds.shape, 2*self.nvars())
+            raise ValueError(msg)
+        self.bounds = self._la_reshape(
+            self.bounds, (self.bounds.shape[0]//2, 2))
+        if self._la_where(
+                (self._values < self.bounds[:, 0]) |
+                (self._values > self.bounds[:, 1]))[0].shape[0] > 0:
+            raise ValueError("values outside bounds")
+        self._active_indices = self._la_tointeger(self._la_atleast1d(
+            self._la_arange(self.nvars())[~self._la_isnan(self.bounds[:, 0])]))
+
+    def nvars(self):
+        """Return the number of hyperparameters."""
+        return self._nvars
+
+    def nactive_vars(self):
+        """Return the number of active (to be optinized) hyperparameters."""
+        return self._active_indices.shape[0]
+
+    def set_active_opt_params(self, active_params):
+        """Set the values of the active parameters in the optimization space.
+        """
+        # The copy ensures that the error
+        # "a leaf Variable that requires grad is being used in an in-place
+        # operation is not thrown
+        self._values = self._la_copy(self._values)
+        self._values[self._active_indices] = self.transform.from_opt_space(
+            active_params)
+
+    def get_active_opt_params(self):
+        """Get the values of the active parameters in the optimization space.
+        """
+        return self.transform.to_opt_space(self._values[self._active_indices])
+
+    def get_active_opt_bounds(self):
+        """Set the bounds of the active parameters in the optimization space.
+        """
+        return self.transform.to_opt_space(
+            self.bounds[self._active_indices, :])
+
+    def get_values(self):
+        """Get the values of the parameters in the user space."""
+        return self._values
+
+    def set_values(self, values):
+        """Set the values of the parameters in the user space."""
+        self._values = values
+
+    def _short_repr(self):
+        if self.nvars() > 5:
+            return "{0}:nvars={1}".format(self.name, self.nvars())
+
+        return "{0}={1}".format(
+            self.name,
+            "["+", ".join(map("{0:.2g}".format, self._values))+"]")
+
+    def __repr__(self):
+        if self.nvars() > 5:
+            return (
+                "{0}(name={1}, nvars={2}, transform={3}, nactive={4})".format(
+                    self.__class__.__name__, self.name, self.nvars(),
+                    self.transform, self.nactive_vars()))
+        return "{0}(name={1}, values={2}, transform={3}, active={4})".format(
+            self.__class__.__name__, self.name,
+            "["+", ".join(map("{0:.2g}".format, self.get_values()))+"]",
+            self.transform,
+            "["+", ".join(map("{0}".format, self._active_indices))+"]")
+
+    def detach(self):
+        """Detach the hyperparameter values from the computational graph if
+        in use."""
+        self.set_values(self._la_detach(self.get_values()))
+
+
+class HyperParameterList:
+    def __init__(self, hyper_params: list):
+        """A list of hyper-parameters to be used with optimization."""
+        self.hyper_params = hyper_params
+
+    def set_active_opt_params(self, active_params):
+        """Set the values of the active parameters in the optimization space.
+        """
+        cnt = 0
+        for hyp in self.hyper_params:
+            hyp.set_active_opt_params(
+                active_params[cnt:cnt+hyp.nactive_vars()])
+            cnt += hyp.nactive_vars()
+
+    def nactive_vars(self):
+        """Return the number of active (to be optinized) hyperparameters."""
+        cnt = 0
+        for hyp in self.hyper_params:
+            cnt += hyp.nactive_vars()
+        return cnt
+
+    def get_active_opt_params(self):
+        """Get the values of the active parameters in the optimization space.
+        """
+        return self._la_hstack(
+            [hyp.get_active_opt_params() for hyp in self.hyper_params])
+
+    def get_active_opt_bounds(self):
+        """Get the values of the active parameters in the optimization space.
+        """
+        return self._la_vstack(
+            [hyp.get_active_opt_bounds() for hyp in self.hyper_params])
+
+    def get_values(self):
+        """Get the values of the parameters in the user space."""
+        return self._la_hstack([hyp.get_values() for hyp in self.hyper_params])
+
+    def __add__(self, hyp_list):
+        # self.__class__ must be because of the use of mixin with derived
+        # classes
+        return self.__class__(self.hyper_params+hyp_list.hyper_params)
+
+    def __radd__(self, hyp_list):
+        if hyp_list == 0:
+            # for when sum is called over list of HyperParameterLists
+            return self
+        return self.__class__(hyp_list.hyper_params+self.hyper_params)
+
+    def _short_repr(self):
+        # simpler representation used when printing kernels
+        return (
+            ", ".join(
+                map("{0}".format,
+                    [hyp._short_repr() for hyp in self.hyper_params])))
+
+    def __repr__(self):
+        return ("{0}(".format(self.__class__.__name__) +
+                ",\n\t\t   ".join(map("{0}".format, self.hyper_params))+")")
+
+
+class CombinedHyperParameter(HyperParameter):
+    # Some times it is more intuitive for the user to pass to separate
+    # hyperparameters but the code requires them to be treated
+    # as a single hyperparameter, e.g. when set_active_opt_params
+    # that requires both user hyperparameters must trigger an action
+    # like updating of an internal variable not common to all hyperparameter
+    # classes
+    def __init__(self, hyper_params: list):
+        self.hyper_params = hyper_params
+        self.bounds = self._la_vstack(
+            [hyp.bounds for hyp in self.hyper_params])
+
+    def nvars(self):
+        return sum([hyp.nvars() for hyp in self.hyper_params])
+
+    def nactive_vars(self):
+        return sum([hyp.nactive_vars() for hyp in self.hyper_params])
+
+    def set_active_opt_params(self, active_params):
+        cnt = 0
+        for hyp in self.hyper_params:
+            hyp.set_active_opt_params(
+                active_params[cnt:cnt+hyp.nactive_vars()])
+            cnt += hyp.nactive_vars()
+
+    def get_active_opt_params(self):
+        return self._la_hstack(
+            [hyp.get_active_opt_params() for hyp in self.hyper_params])
+
+    def get_active_opt_bounds(self):
+        return self._la_vstack(
+            [hyp.get_active_opt_bounds() for hyp in self.hyper_params])
+
+    def get_values(self):
+        return self._la_hstack([hyp.get_values() for hyp in self.hyper_params])
+
+    def set_values(self, values):
+        cnt = 0
+        for hyp in self.hyper_params:
+            hyp.set_values(values[cnt:cnt+hyp.nvars()])
+            cnt += hyp.nvars()
+
+
+
+# this requires import torch which we want to avoid unless user asks for it
+# def create_hyperparamter(backendname: str = 'numpy'):
+#     backends = {"numpy": NumpyLinearAlgebraBackend,
+#                 "torch": TorchLinearAlgebraBackend}
+#     if backendname not in backends:
+#         raise ValueError("{0} not supported. Select from {1}".format(
+#             backendname, list(backends.keys())))
+#     return backends[backendname]
diff --git a/pyapprox/util/hyperparameter/numpyhyperparameter.py b/pyapprox/util/hyperparameter/numpyhyperparameter.py
new file mode 100644
index 00000000..7e3c4df8
--- /dev/null
+++ b/pyapprox/util/hyperparameter/numpyhyperparameter.py
@@ -0,0 +1,22 @@
+from pyapprox.util.linearalgebra.numpylinalg import NumpyLinAlgMixin
+from pyapprox.util.hyperparameter._hyperparameter import (
+    IdentityHyperParameterTransform, LogHyperParameterTransform,
+    HyperParameter, HyperParameterList)
+
+
+class NumpyIdentityHyperParameterTransform(
+        IdentityHyperParameterTransform, NumpyLinAlgMixin):
+    pass
+
+
+class NumpyLogHyperParameterTransform(
+        LogHyperParameterTransform, NumpyLinAlgMixin):
+    pass
+
+
+class NumpyHyperParameter(HyperParameter, NumpyLinAlgMixin):
+    pass
+
+
+class NumpyHyperParameterList(HyperParameterList, NumpyLinAlgMixin):
+    pass
diff --git a/pyapprox/util/hyperparameter/torchhyperparameter.py b/pyapprox/util/hyperparameter/torchhyperparameter.py
new file mode 100644
index 00000000..1fae606d
--- /dev/null
+++ b/pyapprox/util/hyperparameter/torchhyperparameter.py
@@ -0,0 +1,22 @@
+from pyapprox.util.linearalgebra.torchlinalg import TorchLinAlgMixin
+from pyapprox.util.hyperparameter._hyperparameter import (
+    IdentityHyperParameterTransform, LogHyperParameterTransform,
+    HyperParameter, HyperParameterList)
+
+
+class TorchIdentityHyperParameterTransform(
+        IdentityHyperParameterTransform, TorchLinAlgMixin):
+    pass
+
+
+class TorchLogHyperParameterTransform(
+        LogHyperParameterTransform, TorchLinAlgMixin):
+    pass
+
+
+class TorchHyperParameter(HyperParameter, TorchLinAlgMixin):
+    pass
+
+
+class TorchHyperParameterList(HyperParameterList, TorchLinAlgMixin):
+    pass
diff --git a/pyapprox/util/linearalgebra/__init__.py b/pyapprox/util/linearalgebra/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/pyapprox/util/linearalgebra/linalgbase.py b/pyapprox/util/linearalgebra/linalgbase.py
new file mode 100644
index 00000000..9843e074
--- /dev/null
+++ b/pyapprox/util/linearalgebra/linalgbase.py
@@ -0,0 +1,258 @@
+from abc import ABC, abstractmethod
+
+
+class LinAlgMixin(ABC):
+    """Abstract base class for linear algebra operations.
+
+    Designed to not need a call to __init__."""
+
+    @abstractmethod
+    def _la_dot(self, Amat, Bmat):
+        """Compute the dot product of two matrices."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_eye(self, nrows: int):
+        """Return the identity matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_inv(self, mat):
+        """Compute the inverse of a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_cholesky(self, mat):
+        """Compute the cholesky factorization of a matrix."""
+        raise NotImplementedError
+
+    def _la_cholesky_solve(self, chol, bvec, lower: bool = True):
+        """Solve the linear equation A x = b for x,
+        using the cholesky factorization of A."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_solve_triangular(self, Amat, bvec, lower: bool = True):
+        """Solve the linear equation A x = b for x,
+        when A is a triangular matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_full(self, *args):
+        """Return a matrix with all values set to fill_value"""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_empty(self, *args):
+        """Return a matrix with uniitialized values"""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_exp(self, matrix):
+        """Apply exponential element wise to a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_sqrt(self, matrix):
+        """Apply sqrt element wise to a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_cos(self, matrix):
+        """Apply cos element wise to a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_arccos(self, matrix):
+        """Apply arccos element wise to a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_sin(self, matrix):
+        """Apply sin element wise to a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_log(self, matrix):
+        """Apply log element wise to a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_multidot(self, matrix_list):
+        """Compute the dot product of multiple matrices."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_prod(self, matrix_list, axis=None):
+        """Compute the product of a matrix along a given axis."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_hstack(self, arrays):
+        """Stack arrays horizontally (column wise)."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_vstack(self, arrays):
+        """Stack arrays vertically (row wise)."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_dstack(self, arrays):
+        """Stack arrays along third axis."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_arange(self, *args):
+        """Return equidistant values within a given interval."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_linspace(self, *args):
+        """Return equidistant values within a given interval."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_ndim(self, mat) -> int:
+        """Return the dimension of the tensor."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_repeat(self, mat, nreps):
+        """Makes repeated deep copies of a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_cdist(self, Amat, Bmat):
+        """
+        Return cthe euclidean distance between elements of two matrices.
+        Should be equivalent to
+        scipy.spatial.distance.cdist(Amat, Bmat, metric="euclidean")
+        """
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_einsum(self, *args):
+        """Compute Einstein summation on two tensors."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_trace(self, mat):
+        """Compute the trace of a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_copy(self, mat):
+        """Return a deep copy of a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_get_diagonal(self, mat):
+        """Return the diagonal of a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_isnan(self, mat):
+        """Determine what entries are NAN."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_atleast1d(self, val, dtype=None):
+        """Make an object at least a 1D tensor."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_atleast2d(self, val, dtype=None):
+        """Make an object at least a 2D tensor."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_reshape(self, mat, newshape):
+        """Reshape a matrix."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_where(self, cond):
+        """Return whether elements of a matrix satisfy a condition."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_tointeger(self, mat):
+        """Cast a matrix to integers"""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_inf(self):
+        """Return native representation of infinity."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_norm(self, mat, axis=None):
+        """Return the norm of a matrix along a given axis."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_any(self, mat, axis=None):
+        """Find which elements of a matrix evaluates to True."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_kron(self, Amat, Bmat):
+        """Compute the Kroneker product of two matrices"""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_slogdet(self, Amat):
+        """Compute the log determinant of a matrix"""
+        raise NotImplementedError
+
+    def _la_mean(self, mat, axis=None):
+        """Compute the mean of a matrix"""
+        raise NotImplementedError
+
+    def _la_std(self, mat, axis=None, ddof=0):
+        """Compute the standard-deviation of a matrix"""
+        raise NotImplementedError
+
+    def _la_cov(self, mat, ddof=0, rowvar=True):
+        """Compute the covariance matrix from samples of variables
+        in a matrix."""
+        raise NotImplementedError
+
+    def _la_abs(self, mat):
+        """Compute the absolte values of each entry in a matrix"""
+        raise NotImplementedError
+
+    def _la_detach(self, mat):
+        """Detach a matrix from the computational graph.
+        Override for backends that support automatic differentiation."""
+        return mat
+
+    def __repr__(self):
+        return "{0}".format(self.__class__.__name__)
+
+    def _la_block_cholesky_engine(self, L_A, L_A_inv_B, B, D, return_blocks):
+        schur_comp = D-self._la_multidot((L_A_inv_B.T, L_A_inv_B))
+        L_S = self._la_cholesky(schur_comp)
+        chol_blocks = [L_A, L_A_inv_B.T, L_S]
+        if return_blocks:
+            return chol_blocks
+        return self._la_vstack([
+            self._la_hstack([chol_blocks[0], 0*L_A_inv_B]),
+            self._la_hstack([chol_blocks[1], chol_blocks[2]])])
+
+    def _la_block_cholesky(self, blocks, return_blocks=False):
+        A, B = blocks[0]
+        D = blocks[1][1]
+        L_A = self._la_cholesky(A)
+        L_A_inv_B = self._la_solve_triangular(L_A, B)
+        return self._la_block_cholesky_engine(
+            L_A, L_A_inv_B, B, D, return_blocks)
+
+    def _la_get_correlation_from_covariance(self, cov):
+        r"""
+        Compute the correlation matrix from a covariance matrix
+        """
+        stdev_inv = 1/self._la_sqrt(self._la_get_diagonal(cov))
+        cor = stdev_inv[None, :]*cov*stdev_inv[:, None]
+        return cor
diff --git a/pyapprox/util/linearalgebra/numpylinalg.py b/pyapprox/util/linearalgebra/numpylinalg.py
new file mode 100644
index 00000000..4974f4fc
--- /dev/null
+++ b/pyapprox/util/linearalgebra/numpylinalg.py
@@ -0,0 +1,140 @@
+from typing import List
+
+import numpy as np
+import scipy
+
+from pyapprox.util.linearalgebra.linalgbase import LinAlgMixin
+
+
+class NumpyLinAlgMixin(LinAlgMixin):
+    def _la_dot(self, Amat: np.ndarray, Bmat: np.ndarray) -> np.ndarray:
+        return np.dot(Amat, Bmat)
+
+    def _la_eye(self, nrows: int) -> np.ndarray:
+        return np.eye(nrows)
+
+    def _la_inv(self, matrix: np.ndarray) -> np.ndarray:
+        return np.linalg.inv(matrix)
+
+    def _la_cholesky(self, matrix: np.ndarray) -> np.ndarray:
+        return np.linalg.cholesky(matrix)
+
+    def _la_cholesky_solve(self, chol: np.ndarray, bvec: np.ndarray,
+                           lower: bool = True) -> np.ndarray:
+        return scipy.linalg.cho_solve((chol, lower), bvec)
+
+    def _la_solve_triangular(self, Amat: np.ndarray, bvec: np.ndarray,
+                             lower: bool = True) -> np.ndarray:
+        return scipy.linalg.solve_triangular(Amat, bvec, lower=lower)
+
+    def _la_full(self, *args, dtype=float):
+        return np.full(*args, dtype=dtype)
+
+    def _la_empty(self, *args, dtype=float):
+        return np.empty(*args, dtype=dtype)
+
+    def _la_exp(self, matrix: np.ndarray) -> np.ndarray:
+        return np.exp(matrix)
+
+    def _la_sqrt(self, matrix: np.ndarray) -> np.ndarray:
+        return np.sqrt(matrix)
+
+    def _la_cos(self, matrix: np.ndarray) -> np.ndarray:
+        return np.cos(matrix)
+
+    def _la_arccos(self, matrix: np.ndarray) -> np.ndarray:
+        return np.arccos(matrix)
+
+    def _la_sin(self, matrix: np.ndarray) -> np.ndarray:
+        return np.sin(matrix)
+
+    def _la_log(self, matrix: np.ndarray) -> np.ndarray:
+        return np.log(matrix)
+
+    def _la_multidot(self, matrix_list: List[np.ndarray]) -> np.ndarray:
+        return np.linalg.multi_dot(matrix_list)
+
+    def _la_prod(self, matrix_list: np.ndarray, axis=None) -> np.ndarray:
+        return np.prod(matrix_list, dim=axis)
+
+    def _la_hstack(self, arrays) -> np.ndarray:
+        return np.hstack(arrays)
+
+    def _la_vstack(self, arrays) -> np.ndarray:
+        return np.vstack(arrays)
+
+    def _la_dstack(self, arrays) -> np.ndarray:
+        return np.dstack(arrays)
+
+    def _la_arange(self, *args) -> np.ndarray:
+        return np.arange(*args)
+
+    def _la_linspace(self, *args):
+        return np.linspace(*args)
+
+    def _la_ndim(self, mat: np.ndarray) -> int:
+        return mat.ndim
+
+    def _la_repeat(self, mat: np.ndarray, nreps: int) -> np.ndarray:
+        return np.tile(mat, nreps)
+
+    def _la_cdist(self, Amat: np.ndarray, Bmat: np.ndarray) -> np.ndarray:
+        return scipy.spatial.distance.cdist(Amat, Bmat, metric="euclidean")
+
+    def _la_einsum(self, *args) -> np.ndarray:
+        return np.einsum(*args)
+
+    def _la_trace(self, mat: np.ndarray) -> float:
+        return np.trace(mat)
+
+    def _la_copy(self, mat: np.ndarray) -> np.ndarray:
+        return mat.copy()
+
+    def _la_get_diagonal(self, mat: np.ndarray) -> np.ndarray:
+        return np.diagonal(mat)
+
+    def _la_isnan(self, mat: np.ndarray) -> np.ndarray:
+        return np.isnan(mat)
+
+    def _la_atleast1d(self, val, dtype=float) -> np.ndarray:
+        return np.atleast_1d(val).astype(dtype)
+
+    def _la_atleast2d(self, val, dtype=float) -> np.ndarray:
+        return np.atleast_2d(val).astype(dtype)
+
+    def _la_reshape(self, mat: np.ndarray, newshape) -> np.ndarray:
+        return np.reshape(mat, newshape)
+
+    def _la_where(self, cond: np.ndarray) -> np.ndarray:
+        return np.where(cond)
+
+    def _la_tointeger(self, mat: np.ndarray) -> np.ndarray:
+        return np.asarray(mat, dtype=int)
+
+    def _la_inf(self):
+        return np.inf
+
+    def _la_norm(self, mat: np.ndarray, axis=None) -> np.ndarray:
+        return np.linalg.norm(mat, axis=axis)
+
+    def _la_any(self, mat: np.ndarray, axis=None) -> np.ndarray:
+        return np.any(mat, axis=axis)
+
+    def _la_kron(self, Amat: np.ndarray, Bmat: np.ndarray) -> np.ndarray:
+        return np.kron(Amat, Bmat)
+
+    def _la_slogdet(self, Amat: np.ndarray) -> np.ndarray:
+        return np.linalg.slogdet(Amat)
+
+    def _la_mean(self, mat: np.ndarray, axis: int = None) -> np.ndarray:
+        return np.mean(mat, axis=axis)
+
+    def _la_std(self, mat: np.ndarray, axis: int = None,
+                ddof: int = 0) -> np.ndarray:
+        return np.std(mat, axis=axis, ddof=ddof)
+
+    def _la_cov(self, mat: np.ndarray, ddof=0, rowvar=True) -> np.ndarray:
+        return np.cov(mat, ddof=ddof, rowvar=rowvar)
+
+    def _la_abs(self, mat: np.ndarray) -> np.ndarray:
+        return np.absolute(mat)
diff --git a/pyapprox/util/linearalgebra/torchlinalg.py b/pyapprox/util/linearalgebra/torchlinalg.py
new file mode 100644
index 00000000..5b02376b
--- /dev/null
+++ b/pyapprox/util/linearalgebra/torchlinalg.py
@@ -0,0 +1,153 @@
+from typing import List
+
+import torch
+
+from pyapprox.util.linearalgebra.linalgbase import LinAlgMixin
+
+
+class TorchLinAlgMixin(LinAlgMixin):
+    def _la_dot(self, Amat: torch.Tensor, Bmat: torch.Tensor) -> torch.Tensor:
+        return Amat @ Bmat
+
+    def _la_eye(self, nrows: int) -> torch.Tensor:
+        return torch.eye(nrows)
+
+    def _la_inv(self, matrix: torch.Tensor) -> torch.Tensor:
+        return torch.linalg.inv(matrix)
+
+    def _la_cholesky(self, matrix: torch.Tensor) -> torch.Tensor:
+        return torch.linalg.cholesky(matrix)
+
+    def _la_cholesky_solve(self, chol: torch.Tensor, bvec: torch.Tensor,
+                           lower: bool = True) -> torch.Tensor:
+        return torch.cholesky_solve(bvec, chol, upper=(not lower))
+
+    def _la_solve_triangular(self, Amat: torch.Tensor, bvec: torch.Tensor,
+                             lower: bool = True) -> torch.Tensor:
+        return torch.linalg.solve_triangular(Amat, bvec, upper=(not lower))
+
+    def _la_full(self, *args, dtype=torch.double):
+        return torch.full(*args, dtype=dtype)
+
+    def _la_empty(self, *args, dtype=torch.double):
+        return torch.empty(*args, dtype=dtype)
+
+    def _la_exp(self, matrix: torch.Tensor) -> torch.Tensor:
+        return torch.exp(matrix)
+
+    def _la_sqrt(self, matrix: torch.Tensor) -> torch.Tensor:
+        return torch.sqrt(matrix)
+
+    def _la_cos(self, matrix: torch.Tensor) -> torch.Tensor:
+        return torch.cos(matrix)
+
+    def _la_arccos(self, matrix: torch.Tensor) -> torch.Tensor:
+        return torch.arccos(matrix)
+
+    def _la_sin(self, matrix: torch.Tensor) -> torch.Tensor:
+        return torch.sin(matrix)
+
+    def _la_log(self, matrix: torch.Tensor) -> torch.Tensor:
+        return torch.log(matrix)
+
+    def _la_multidot(self, matrix_list: List[torch.Tensor]) -> torch.Tensor:
+        return torch.linalg.multi_dot(matrix_list)
+
+    def _la_prod(self, matrix_list: torch.Tensor, axis=None) -> torch.Tensor:
+        return torch.prod(matrix_list, dim=axis)
+
+    def _la_hstack(self, arrays) -> torch.Tensor:
+        return torch.hstack(arrays)
+
+    def _la_vstack(self, arrays) -> torch.Tensor:
+        return torch.vstack(arrays)
+
+    def _la_dstack(self, arrays) -> torch.Tensor:
+        return torch.dstack(arrays)
+
+    def _la_arange(self, *args, dtype=torch.double) -> torch.Tensor:
+        return torch.arange(*args, dtype=dtype)
+
+    def _la_linspace(self, *args, dtype=torch.double):
+        return torch.linspace(*args, dtype=dtype)
+
+    def _la_ndim(self, mat: torch.Tensor) -> int:
+        return mat.ndim
+
+    def _la_repeat(self, mat: torch.Tensor, nreps: int) -> torch.Tensor:
+        return mat.repeat(nreps)
+
+    def _la_cdist(self, Amat: torch.tensor,
+                  Bmat: torch.tensor) -> torch.Tensor:
+        return torch.cdist(Amat, Bmat, p=2)
+
+    def _la_einsum(self, *args) -> torch.Tensor:
+        return torch.einsum(*args)
+
+    def _la_trace(self, mat: torch.Tensor) -> torch.Tensor:
+        return torch.trace(mat)
+
+    def _la_copy(self, mat: torch.Tensor) -> torch.Tensor:
+        return mat.clone()
+
+    def _la_get_diagonal(self, mat: torch.Tensor) -> torch.Tensor:
+        return torch.diagonal(mat)
+
+    def _la_isnan(self, mat) -> torch.Tensor:
+        return torch.isnan(mat)
+
+    def _la_atleast1d(self, val, dtype=torch.double) -> torch.Tensor:
+        return torch.atleast_1d(
+            torch.as_tensor(val, dtype=dtype))
+
+    def _la_atleast2d(self, val, dtype=torch.double) -> torch.Tensor:
+        return torch.atleast_2d(
+            torch.as_tensor(val, dtype=dtype))
+
+    def _la_reshape(self, mat: torch.Tensor, newshape) -> torch.Tensor:
+        return torch.reshape(mat, newshape)
+
+    def _la_where(self, cond: torch.Tensor) -> torch.Tensor:
+        return torch.where(cond)
+
+    def _la_detach(self, mat: torch.Tensor) -> torch.Tensor:
+        return mat.detach()
+
+    def _la_tointeger(self, mat: torch.Tensor) -> torch.Tensor:
+        return mat.int()
+
+    def _la_inf(self):
+        return torch.inf
+
+    def _la_norm(self, mat: torch.Tensor, axis=None) -> torch.Tensor:
+        return torch.linalg.norm(mat, dim=axis)
+
+    def _la_any(self, mat: torch.Tensor, axis=None) -> torch.Tensor:
+        if axis is None:
+            return torch.any(mat)
+        return torch.any(mat, dim=axis)
+
+    def _la_kron(self, Amat: torch.Tensor, Bmat: torch.Tensor) -> torch.Tensor:
+        return torch.kron(Amat, Bmat)
+
+    def _la_slogdet(self, Amat: torch.Tensor) -> torch.Tensor:
+        return torch.linalg.slogdet(Amat)
+
+    def _la_mean(self, mat: torch.Tensor, axis: int = None) -> torch.Tensor:
+        if axis is None:
+            return torch.mean(mat)
+        return torch.mean(mat, dim=axis)
+
+    def _la_std(self, mat: torch.Tensor, axis: int = None,
+                ddof: int = 0) -> torch.Tensor:
+        if axis is None:
+            return torch.std(mat, correction=ddof)
+        return torch.std(mat, dim=axis, correction=ddof)
+
+    def _la_cov(self, mat: torch.Tensor, ddof=0, rowvar=True) -> torch.Tensor:
+        if rowvar:
+            return torch.cov(mat, correction=ddof)
+        return torch.cov(mat.T, correction=ddof)
+
+    def _la_abs(self, mat: torch.Tensor) -> torch.Tensor:
+        return torch.absolute(mat)
diff --git a/pyapprox/surrogates/autogp/tests/test_hyperparameter.py b/pyapprox/util/tests/test_hyperparameter.py
similarity index 59%
rename from pyapprox/surrogates/autogp/tests/test_hyperparameter.py
rename to pyapprox/util/tests/test_hyperparameter.py
index 0fe378e0..9675700b 100644
--- a/pyapprox/surrogates/autogp/tests/test_hyperparameter.py
+++ b/pyapprox/util/tests/test_hyperparameter.py
@@ -1,16 +1,21 @@
 import unittest
 import numpy as np
 
-from pyapprox.surrogates.autogp.hyperparameter import (
-    LogHyperParameterTransform, IdentityHyperParameterTransform,
-    HyperParameter, HyperParameterList)
+from pyapprox.util.hyperparameter.numpyhyperparameter import (
+    NumpyLogHyperParameterTransform, NumpyIdentityHyperParameterTransform,
+    NumpyHyperParameter, NumpyHyperParameterList)
+from pyapprox.util.hyperparameter.torchhyperparameter import (
+    TorchLogHyperParameterTransform, TorchIdentityHyperParameterTransform,
+    TorchHyperParameter, TorchHyperParameterList)
 
 
 class TestHyperParameter(unittest.TestCase):
     def setUp(self):
         np.random.seed(1)
 
-    def test_hyperparameter(self):
+    def _check_hyperparameter(
+            self, LogHyperParameterTransform, IdentityHyperParameterTransform,
+            HyperParameter, HyperParameterList):
         transform_0 = LogHyperParameterTransform()
         hyp_0 = HyperParameter("P0", 3, 1, [0.01, 2], transform_0)
         assert np.allclose(
@@ -19,7 +24,7 @@ def test_hyperparameter(self):
 
         transform_1 = IdentityHyperParameterTransform()
         hyp_1 = HyperParameter(
-            "P1", 2, -0.5, [-1, 6, np.nan, np.nan], transform_1)
+            "P1", 2, -0.5, [-1, 6, -np.nan, np.nan], transform_1)
         hyp_list_0 = HyperParameterList([hyp_0, hyp_1])
         assert np.allclose(
             hyp_list_0.get_active_opt_bounds(), np.vstack((
@@ -39,6 +44,19 @@ def test_hyperparameter(self):
                 np.array([[-3, 3]]),
             )))
 
+    def test_hyperparameter(self):
+        test_cases = [
+            [NumpyLogHyperParameterTransform,
+             NumpyIdentityHyperParameterTransform, NumpyHyperParameter,
+             NumpyHyperParameterList],
+            [TorchLogHyperParameterTransform,
+             TorchIdentityHyperParameterTransform, TorchHyperParameter,
+             TorchHyperParameterList],
+        ]
+        for case in test_cases:
+            self._check_hyperparameter(*case)
+
+
 if __name__ == "__main__":
     hyperparameter_test_suite = unittest.TestLoader().loadTestsFromTestCase(
         TestHyperParameter)
diff --git a/pyapprox/surrogates/autogp/tests/test_transforms.py b/pyapprox/util/tests/test_transforms.py
similarity index 57%
rename from pyapprox/surrogates/autogp/tests/test_transforms.py
rename to pyapprox/util/tests/test_transforms.py
index 1b23252a..ec30344b 100644
--- a/pyapprox/surrogates/autogp/tests/test_transforms.py
+++ b/pyapprox/util/tests/test_transforms.py
@@ -2,33 +2,38 @@
 import numpy as np
 import torch
 
-from pyapprox.surrogates.autogp.transforms import (
-    NSphereCoordinateTransform, SphericalCorrelationTransform)
+from pyapprox.util.transforms.numpytransforms import (
+    NumpyNSphereCoordinateTransform, NumpySphericalCorrelationTransform)
+from pyapprox.util.transforms.torchtransforms import (
+    TorchNSphereCoordinateTransform, TorchSphericalCorrelationTransform)
 
 
 class TestTransforms(unittest.TestCase):
     def setUp(self):
         np.random.seed(1)
 
-    def check_nsphere_coordinate_transform(self, nvars):
+    def _check_nsphere_coordinate_transform(
+            self, nvars, NSphereCoordinateTransform):
         nsamples = 10
         trans = NSphereCoordinateTransform()
         psi = np.vstack((np.random.uniform(1, 2, (1, nsamples)),
                          np.random.uniform(0, np.pi, (nvars-2, nsamples)),
                          np.random.uniform(0, 2*np.pi, (1, nsamples))))
-        samples = trans.map_from_nsphere(
-            torch.as_tensor(psi, dtype=torch.double))
+        samples = trans.map_from_nsphere(trans._la_atleast2d(psi))
         psi_recovered = trans.map_to_nsphere(samples)
         assert np.allclose(psi_recovered, psi, rtol=1e-12)
 
     def test_nsphere_coordinate_transform(self):
         test_cases = [
-            [2], [3], [4], [5]
-        ]
+            [kk, NumpyNSphereCoordinateTransform] for kk in range(2, 6)]
+        test_cases += [
+            [kk, TorchNSphereCoordinateTransform] for kk in range(2, 6)]
         for test_case in test_cases:
-            self.check_nsphere_coordinate_transform(*test_case)
+            np.random.seed(1)
+            self._check_nsphere_coordinate_transform(*test_case)
 
-    def check_spherical_correlation_transform(self, noutputs):
+    def _check_spherical_correlation_transform(
+            self, noutputs, SphericalCorrelationTransform):
         # constrained formulation
         trans = SphericalCorrelationTransform(noutputs)
 
@@ -39,36 +44,34 @@ def check_spherical_correlation_transform(self, noutputs):
             np.random.uniform(0, np.pi, (trans.ntheta-trans.noutputs)),
         ))
 
-        psi = trans.map_theta_to_spherical(
-            torch.as_tensor(theta, dtype=torch.double))
+        psi = trans.map_theta_to_spherical(trans._la_atleast1d(theta))
         theta_recovered = trans.map_spherical_to_theta(psi)
         assert np.allclose(theta, theta_recovered, rtol=1e-12)
 
         L = trans.map_to_cholesky(
             torch.as_tensor(theta, dtype=torch.double))
-        theta_recovered = trans.map_from_cholesky(
-            torch.as_tensor(L, dtype=torch.double))
+        theta_recovered = trans.map_from_cholesky(L)
         assert np.allclose(theta, theta_recovered, rtol=1e-12)
 
     def test_spherical_correlation_transform(self):
         # Use test case from PINHEIRO 1 and BATES
         noutputs = 3
-        trans = SphericalCorrelationTransform(noutputs)
+        trans = NumpySphericalCorrelationTransform(noutputs)
         trans._unconstrained = True
-        L = np.array([[1, 0, 0], [1, 2, 0], [1, 2, 3]])
-        theta_recovered = trans.map_from_cholesky(
-            torch.as_tensor(L, dtype=torch.double))
-        theta = np.array(
+        L = trans._la_atleast2d([[1, 0, 0], [1, 2, 0], [1, 2, 3]])
+        theta_recovered = trans.map_from_cholesky(trans._la_atleast2d(L))
+        theta = trans._la_atleast1d(
             [0, np.log(5)/2, np.log(14)/2, -0.608, -0.348, -0.787])
         # answer is only reported to 3 decimals
         assert np.allclose(theta_recovered, theta, rtol=1e-3)
 
         test_cases = [
-            [2], [3], [4], [5]
-        ]
+            [kk, NumpySphericalCorrelationTransform] for kk in range(2, 6)]
+        test_cases += [
+            [kk, TorchSphericalCorrelationTransform] for kk in range(2, 6)]
         for test_case in test_cases:
             np.random.seed(1)
-            self.check_spherical_correlation_transform(*test_case)
+            self._check_spherical_correlation_transform(*test_case)
 
 
 if __name__ == "__main__":
diff --git a/pyapprox/util/transforms/__init__.py b/pyapprox/util/transforms/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/pyapprox/surrogates/autogp/transforms.py b/pyapprox/util/transforms/_transforms.py
similarity index 55%
rename from pyapprox/surrogates/autogp/transforms.py
rename to pyapprox/util/transforms/_transforms.py
index b9338ed4..b6146238 100644
--- a/pyapprox/surrogates/autogp/transforms.py
+++ b/pyapprox/util/transforms/_transforms.py
@@ -1,11 +1,8 @@
-import numpy as np
 from abc import ABC, abstractmethod
+import math
 
-from pyapprox.surrogates.autogp._torch_wrappers import (
-    sqrt, full, copy, arccos, sin, cos, empty, log, exp)
 
-
-class ValuesTransform(ABC):
+class Transform(ABC):
     @abstractmethod
     def map_from_canonical(self, values):
         raise NotImplementedError
@@ -14,12 +11,11 @@ def map_from_canonical(self, values):
     def map_to_canonical(self, values):
         raise NotImplementedError
 
-    @abstractmethod
     def map_stdev_from_canonical(self, canonical_stdevs):
         raise NotImplementedError
 
 
-class IdentityValuesTransform(ValuesTransform):
+class IdentityTransform(Transform):
     def map_from_canonical(self, values):
         return values
 
@@ -30,14 +26,22 @@ def map_stdev_from_canonical(self, canonical_stdevs):
         return canonical_stdevs
 
 
-class StandardDeviationValuesTransform(ValuesTransform):
-    def __init__(self):
+class StandardDeviationTransform(Transform):
+    def __init__(self, trans=False):
+        # todo: samples and values should always be (nvars, nsamples)
+        # where nvars=nqois but currently values is transpose of this
+        # so trans=True is used to deal with this case
+        self._trans = trans
         self._means = None
         self._stdevs = None
 
     def map_to_canonical(self, values):
-        self._means = values.mean(axis=0)[:, None]
-        self._stdevs = values.std(axis=0, ddof=1)[:, None]
+        if not self._trans:
+            self._means = self._la_mean(values, axis=1)[:, None]
+            self._stdevs = self._la_std(values, axis=1, ddof=1)[:, None]
+        else:
+            self._means = self._la_mean(values, axis=0)[:, None]
+            self._stdevs = self._la_std(values, axis=0, ddof=1)[:, None]
         canonical_values = (values-self._means)/self._stdevs
         return canonical_values
 
@@ -49,67 +53,77 @@ def map_stdev_from_canonical(self, canonical_stdevs):
         return canonical_stdevs*self._stdevs
 
 
-class NSphereCoordinateTransform():
+class NSphereCoordinateTransform(Transform):
     def map_to_nsphere(self, samples):
         nvars, nsamples = samples.shape
-        r = sqrt((samples**2).sum(axis=0))
-        psi = full(samples.shape, 0.)
-        psi[0] = copy(r)
-        psi[1] = arccos(samples[0]/r)
+        r = self._la_sqrt((samples**2).sum(axis=0))
+        psi = self._la_full(samples.shape, 0.)
+        psi[0] = self._la_copy(r)
+        psi[1] = self._la_arccos(samples[0]/r)
         for ii in range(2, nvars):
-            denom = copy(r)
+            denom = self._la_copy(r)
             for jj in range(ii-1):
-                denom *= sin(psi[jj+1])
-            psi[ii] = arccos(samples[ii-1]/denom)
-        psi[-1][samples[-1] < 0] = 2*np.pi-psi[-1][samples[-1] < 0]
+                denom *= self._la_sin(psi[jj+1])
+            psi[ii] = self._la_arccos(samples[ii-1]/denom)
+        psi[-1][samples[-1] < 0] = 2*math.pi-psi[-1][samples[-1] < 0]
         return psi
 
     def map_from_nsphere(self, psi):
         nvars, nsamples = psi.shape
-        r = copy(psi[0])
-        samples = full(psi.shape, 0.)
-        samples[0] = r*cos(psi[1])
+        r = self._la_copy(psi[0])
+        samples = self._la_full(psi.shape, 0.)
+        samples[0] = r*self._la_cos(psi[1])
         for ii in range(1, nvars):
-            samples[ii, :] = copy(r)
+            samples[ii, :] = self._la_copy(r)
             for jj in range(ii):
-                samples[ii] *= sin(psi[jj+1])
+                samples[ii] *= self._la_sin(psi[jj+1])
             if ii != nvars-1:
-                samples[ii] *= cos(psi[ii+1])
+                samples[ii] *= self._la_cos(psi[ii+1])
         return samples
 
+    def map_to_canonical(self, psi):
+        return self.map_from_nsphere(psi)
+
+    def map_from_canonical(self, canonical_samples):
+        return self.map_to_nsphere(canonical_samples)
 
-class SphericalCorrelationTransform():
+
+class SphericalCorrelationTransform(Transform):
     def __init__(self, noutputs):
         self.noutputs = noutputs
         self.ntheta = (self.noutputs*(self.noutputs+1))//2
-        self._theta_indices = np.full((self.ntheta, 2), -1, dtype=int)
-        self._theta_indices[:self.noutputs, 0] = np.arange(self.noutputs)
+        self._theta_indices = self._la_full((self.ntheta, 2), -1, dtype=int)
+        self._theta_indices[:self.noutputs, 0] = self._la_arange(self.noutputs)
         self._theta_indices[:self.noutputs, 1] = 0
         for ii in range(1, noutputs):
             for jj in range(1, ii+1):
                 # indices[ii, jj] = (
                 #     self.noutputs+((ii-1)*(ii))//2 + (jj-1))
                 self._theta_indices[
-                    self.noutputs+((ii-1)*(ii))//2 + (jj-1)] = ii, jj
-        self.nsphere_trans = NSphereCoordinateTransform()
+                    self.noutputs+((ii-1)*(ii))//2 + (jj-1)] = (
+                        self._la_atleast1d([ii, jj]))
+        self.nsphere_trans = self._NSphereCoordinateTransform()
         # unconstrained formulation does not seem unique.
         self._unconstrained = False
 
     def get_spherical_bounds(self):
+        inf = self._la_inf()
         if not self._unconstrained:
             # l_{i1} > 0,  i = 0,...,noutputs-1
-            # l_{ij} in (0, np.pi),    i = 1,...,noutputs-1, j=1,...,i
+            # l_{ij} in (0, math.pi),    i = 1,...,noutputs-1, j=1,...,i
             eps = 0
-            bounds = np.array([[eps, np.inf] for ii in range(self.noutputs)])
-            other_bounds = np.array([
-                [eps, np.pi-eps] for ii in range(self.noutputs, self.ntheta)])
-            bounds = np.vstack((bounds, other_bounds))
+            bounds = self._la_atleast2d(
+                [[eps, inf] for ii in range(self.noutputs)])
+            other_bounds = self._la_atleast2d([
+                [eps, math.pi-eps]
+                for ii in range(self.noutputs, self.ntheta)])
+            bounds = self._la_vstack((bounds, other_bounds))
             return bounds
 
-        return np.array([[-np.inf, np.inf] for ii in range(self.theta)])
+        return self._la_atleast2d([[-inf, inf] for ii in range(self.theta)])
 
     def map_cholesky_to_spherical(self, L):
-        psi = empty(L.shape)
+        psi = self._la_empty(L.shape)
         psi[0, 0] = L[0, 0]
         for ii in range(1, self.noutputs):
             psi[ii, :ii+1] = self.nsphere_trans.map_to_nsphere(
@@ -117,12 +131,12 @@ def map_cholesky_to_spherical(self, L):
         return psi
 
     def map_spherical_to_unconstrained_theta(self, psi):
-        theta = empty(self.ntheta)
-        theta[:self.noutputs] = log(psi[:, 0])
+        theta = self._la_empty(self.ntheta)
+        theta[:self.noutputs] = self._la_log(psi[:, 0])
         psi_flat = psi[
             self._theta_indices[self.noutputs:, 0],
             self._theta_indices[self.noutputs:, 1]]
-        theta[self.noutputs:] = log(psi_flat/(np.pi-psi_flat))
+        theta[self.noutputs:] = self._la_log(psi_flat/(math.pi-psi_flat))
         return theta
 
     def map_spherical_to_theta(self, psi):
@@ -135,19 +149,20 @@ def map_from_cholesky(self, L):
         return self.map_spherical_to_theta(psi)
 
     def map_unconstrained_theta_to_spherical(self, theta):
-        psi = full((self.noutputs, self.noutputs), 0.)
+        psi = self._la_full((self.noutputs, self.noutputs), 0.)
         # psi[ii, :] are radius of hypersphere of increasing dimension
         # all other psi are angles
-        exp_theta = exp(theta)
+        exp_theta = self._la_exp(theta)
         psi[:, 0] = exp_theta[:self.noutputs]
         psi[self._theta_indices[self.noutputs:, 0],
             self._theta_indices[self.noutputs:, 1]] = (
-                exp_theta[self.noutputs:]*np.pi/(1+exp_theta[self.noutputs:]))
+                exp_theta[self.noutputs:]*math.pi/(
+                    1+exp_theta[self.noutputs:]))
         # cnt = self.noutputs
         # for ii in range(1, self.noutputs):
         #     for jj in range(1, ii+1):
         #         exp_theta = exp(theta[cnt])
-        #         psi[ii, jj] = exp_theta*np.pi/(1+exp_theta)
+        #         psi[ii, jj] = exp_theta*math.pi/(1+exp_theta)
         #         cnt += 1
         return psi
 
@@ -157,12 +172,12 @@ def map_theta_to_spherical(self, theta):
         if self._unconstrained:
             psi = self.map_unconstrained_theta_to_spherical(theta)
             return self.map_spherical_to_cholesky(psi)
-        psi = full((self.noutputs, self.noutputs), 0.)
+        psi = self._la_full((self.noutputs, self.noutputs), 0.)
         psi[self._theta_indices[:, 0], self._theta_indices[:, 1]] = theta
         return psi
 
     def map_spherical_to_cholesky(self, psi):
-        L_factor = full((self.noutputs, self.noutputs), 0.)
+        L_factor = self._la_full((self.noutputs, self.noutputs), 0.)
         L_factor[0, 0] = psi[0, 0]
         for ii in range(1, self.noutputs):
             L_factor[ii:ii+1, :ii+1] = self.nsphere_trans.map_from_nsphere(
@@ -172,3 +187,9 @@ def map_spherical_to_cholesky(self, psi):
     def map_to_cholesky(self, theta):
         psi = self.map_theta_to_spherical(theta)
         return self.map_spherical_to_cholesky(psi)
+
+    def map_to_canonical(self, samples):
+        return self._map_from_cholesky(samples)
+
+    def map_from_canonical(self, canonical_samples):
+        return self._map_to_cholesky(canonical_samples)
diff --git a/pyapprox/util/transforms/numpytransforms.py b/pyapprox/util/transforms/numpytransforms.py
new file mode 100644
index 00000000..e00aac92
--- /dev/null
+++ b/pyapprox/util/transforms/numpytransforms.py
@@ -0,0 +1,24 @@
+from pyapprox.util.linearalgebra.numpylinalg import NumpyLinAlgMixin
+from pyapprox.util.transforms._transforms import (
+    IdentityTransform, StandardDeviationTransform,
+    NSphereCoordinateTransform, SphericalCorrelationTransform)
+
+
+NumpyIdentityTransform = IdentityTransform
+
+
+class NumpyStandardDeviationTransform(
+        StandardDeviationTransform, NumpyLinAlgMixin):
+    pass
+
+
+class NumpyNSphereCoordinateTransform(
+        NSphereCoordinateTransform, NumpyLinAlgMixin):
+    pass
+
+
+class NumpySphericalCorrelationTransform(
+        SphericalCorrelationTransform, NumpyLinAlgMixin):
+    def __init__(self, noutputs):
+        self._NSphereCoordinateTransform = NumpyNSphereCoordinateTransform
+        super().__init__(noutputs)
diff --git a/pyapprox/util/transforms/torchtransforms.py b/pyapprox/util/transforms/torchtransforms.py
new file mode 100644
index 00000000..86d0c69f
--- /dev/null
+++ b/pyapprox/util/transforms/torchtransforms.py
@@ -0,0 +1,24 @@
+from pyapprox.util.linearalgebra.torchlinalg import TorchLinAlgMixin
+from pyapprox.util.transforms._transforms import (
+    IdentityTransform, StandardDeviationTransform,
+    NSphereCoordinateTransform, SphericalCorrelationTransform)
+
+
+TorchIdentityTransform = IdentityTransform
+
+
+class TorchStandardDeviationTransform(
+        StandardDeviationTransform, TorchLinAlgMixin):
+    pass
+
+
+class TorchNSphereCoordinateTransform(
+        NSphereCoordinateTransform, TorchLinAlgMixin):
+    pass
+
+
+class TorchSphericalCorrelationTransform(
+        SphericalCorrelationTransform, TorchLinAlgMixin):
+    def __init__(self, noutputs):
+        self._NSphereCoordinateTransform = TorchNSphereCoordinateTransform
+        super().__init__(noutputs)
diff --git a/setup.py b/setup.py
index 5b264c1c..6055cf70 100644
--- a/setup.py
+++ b/setup.py
@@ -72,6 +72,7 @@ def no_cythonize(extensions, **_ignore):
     },
     ext_modules=extensions,
     license='MIT',
+    package_dir={'': ''},
 )
 
 #TODO see https://pytest-cov.readthedocs.io/en/latest/config.html

From a21c58faa45be360039b55a6ed3616e875910981 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Thu, 23 May 2024 09:06:29 -0600
Subject: [PATCH 05/15] Use LinalgMixins to create torch and numpy KLEs

---
 pyapprox/benchmarks/pde_benchmarks.py         | 55 +++-----------
 pyapprox/expdesign/tests/test_optbayes.py     |  3 +-
 pyapprox/interface/model.py                   |  9 +++
 pyapprox/pde/hdg/parameterized_models.py      |  4 +-
 pyapprox/pde/kle/__init__.py                  |  3 +
 .../_kle.py}                                  | 72 +++++++++----------
 pyapprox/pde/kle/numpykle.py                  | 10 +++
 pyapprox/pde/kle/torchkle.py                  | 48 +++++++++++++
 pyapprox/pde/tests/test_karhunen_loeve.py     | 38 ++++++----
 .../surrogates/autogp/tests/test_mokernels.py |  2 +-
 pyapprox/util/linearalgebra/linalgbase.py     | 27 ++++++-
 pyapprox/util/linearalgebra/numpylinalg.py    | 19 +++++
 pyapprox/util/linearalgebra/torchlinalg.py    | 23 ++++++
 13 files changed, 212 insertions(+), 101 deletions(-)
 create mode 100644 pyapprox/pde/kle/__init__.py
 rename pyapprox/pde/{karhunen_loeve_expansion.py => kle/_kle.py} (89%)
 create mode 100644 pyapprox/pde/kle/numpykle.py
 create mode 100644 pyapprox/pde/kle/torchkle.py

diff --git a/pyapprox/benchmarks/pde_benchmarks.py b/pyapprox/benchmarks/pde_benchmarks.py
index 9d55b4b3..daf8fd15 100644
--- a/pyapprox/benchmarks/pde_benchmarks.py
+++ b/pyapprox/benchmarks/pde_benchmarks.py
@@ -15,7 +15,7 @@
 )
 from pyapprox.variables import IndependentMarginalsVariable
 from pyapprox.variables.transforms import ConfigureVariableTransformation
-from pyapprox.pde.karhunen_loeve_expansion import MeshKLE, TorchKLEWrapper
+from pyapprox.pde.kle.torchkle import TorchMeshKLE, TorchInterpolatedMeshKLE
 from pyapprox.interface.wrappers import (
     evaluate_1darray_function_on_2d_array, MultiIndexModel, ModelEnsemble)
 
@@ -96,12 +96,12 @@ def loglike_functional_dqdp(obs, obs_indices, noise_std, sol, params):
 def raw_advection_diffusion_reaction_kle_dRdp(kle, residual, sol, param_vals):
     mesh = residual.mesh
     dmats = [residual.mesh._dmat(dd) for dd in range(mesh.nphys_vars)]
-    if kle.use_log:
+    if kle._use_log:
         # compute gradient of diffusivity with respect to KLE coeff
         assert param_vals.ndim == 1
         kle_vals = kle(param_vals[:, None])
         assert kle_vals.ndim == 2
-        dkdp = kle_vals*kle.eig_vecs
+        dkdp = kle_vals*kle._eig_vecs
     else:
         dkdp = kle.eig_vecs
     Du = [torch.linalg.multi_dot((dmats[dd], sol))
@@ -123,9 +123,9 @@ def advection_diffusion_reaction_kle_dRdp(
         elif bndry_cond[1] == "R":
             mesh_pts_idx = mesh._bndry_slice(mesh.mesh_pts, idx, 1)
             normal_vals = mesh._bndrys[ii].normals(mesh_pts_idx)
-            if kle.use_log:
+            if kle._use_log:
                 kle_vals = kle(param_vals[:, None])
-                dkdp = kle_vals*kle.eig_vecs
+                dkdp = kle_vals*kle._eig_vecs
             else:
                 dkdp = torch.as_tensor(kle.eig_vecs)
             flux_vals = [
@@ -206,7 +206,7 @@ def _fast_interpolate(self, values, xx):
     def _set_random_sample(self, sample):
         self._fwd_solver.physics._diff_fun = partial(
             self._fast_interpolate,
-            self._kle(sample[:, None]))
+            self._kle(self._kle._la_atleast2d(sample[:, None])))
 
     def _eval(self, sample, return_grad=False):
         sample_copy = torch.as_tensor(sample.copy(), dtype=torch.double)
@@ -341,12 +341,12 @@ def _setup_advection_diffusion_benchmark(
     vel_fun = partial(constant_vel_fun, vel_vec)
 
     if kle_args is None:
-        npkle = MeshKLE(
+        kle = TorchMeshKLE(
             mesh.mesh_pts, length_scale, sigma=sigma, nterms=nvars,
             use_log=True, mean_field=kle_mean_field)
-        kle = TorchKLEWrapper(npkle)
+        # kle = TorchKLEWrapper(npkle)
     else:
-        kle = InterpolatedMeshKLE(kle_args[0], kle_args[1], mesh)
+        kle = TorchInterpolatedMeshKLE(kle_args[0], kle_args[1], mesh)
 
     if time_scenario is None:
         forc_fun = partial(gauss_forc_fun, amp, scale, loc)
@@ -371,43 +371,6 @@ def _setup_advection_diffusion_benchmark(
     return model, variable
 
 
-class InterpolatedMeshKLE(MeshKLE):
-    def __init__(self, kle_mesh, kle, mesh):
-        self._kle_mesh = kle_mesh
-        self._kle = kle
-        self._mesh = mesh
-
-        self.matern_nu = self._kle._matern_nu
-        self.nterms = self._kle._nterms
-        self.lenscale = self._kle._lenscale
-
-        self._basis_mat = self._kle_mesh._get_lagrange_basis_mat(
-            self._kle_mesh._canonical_mesh_pts_1d,
-            mesh._map_samples_to_canonical_domain(self._mesh.mesh_pts))
-
-    def _fast_interpolate(self, values, xx):
-        assert xx.shape[1] == self._mesh.mesh_pts.shape[1]
-        assert np.allclose(xx, self._mesh.mesh_pts)
-        interp_vals = torch.linalg.multi_dot((self._basis_mat, values))
-        # assert np.allclose(
-        #     interp_vals, self._kle_mesh.interpolate(values, xx))
-        return interp_vals
-
-    def __call__(self, coef):
-        assert isinstance(self._kle, TorchKLEWrapper)
-        # use_log = self._kle._use_log
-        use_log = self._kle._kle._use_log
-        self._kle._kle._use_log = False
-        vals = self._kle(coef)
-        interp_vals = self._fast_interpolate(vals, self._mesh.mesh_pts)
-        mean_field = self._fast_interpolate(
-            torch.as_tensor(self._kle._mean_field[:, None], dtype=torch.double),
-            self._mesh.mesh_pts)
-        if use_log:
-            interp_vals = torch.exp(mean_field+interp_vals)
-        self._kle._kle._use_log = use_log
-        return interp_vals
-
 
 def _setup_inverse_advection_diffusion_benchmark(
         amp, scale, loc, nobs, noise_std, length_scale, sigma, nvars, orders,
diff --git a/pyapprox/expdesign/tests/test_optbayes.py b/pyapprox/expdesign/tests/test_optbayes.py
index 9129c61e..107be174 100644
--- a/pyapprox/expdesign/tests/test_optbayes.py
+++ b/pyapprox/expdesign/tests/test_optbayes.py
@@ -215,7 +215,7 @@ def _check_classical_KL_OED_gaussian_optimization(
         x0 = np.full((nobs, 1), nfinal_obs/nobs)
         errors = objective.check_apply_jacobian(
             x0, disp=True, fd_eps=np.logspace(-13, np.log(0.2), 13)[::-1])
-        assert errors.min()/errors.max() < 6e-6, errors.min()/errors.max()
+        assert errors.min()/errors.max() < 7e-6, errors.min()/errors.max()
         # turn on hessian for testing hessian implementation, but
         # apply hessian is turned off because while it reduces
         # optimization iteration count but increases
@@ -371,6 +371,7 @@ def _check_prediction_gaussian_OED(
         result = optimizer.minimize(x0)
         print(result.x)
 
+    @unittest.skip("Implementation not finished")
     def test_prediction_gaussian_OED(self):
         test_cases = [
             [3, 0, 1, 4000, 50, NoiseStatistic(SampleAverageMean())],
diff --git a/pyapprox/interface/model.py b/pyapprox/interface/model.py
index 383661c4..5a6cb149 100644
--- a/pyapprox/interface/model.py
+++ b/pyapprox/interface/model.py
@@ -662,8 +662,17 @@ def __init__(self, function, nvars, inactive_var_values,
         assert np.all(self._active_var_indices < self._nvars)
         self._inactive_var_indices = np.delete(
             np.arange(self._nvars), active_var_indices)
+        if base_model is None:
+            base_model = function
         self._base_model = base_model
 
+        self._jacobian_implemented = self._base_model._jacobian_implemented
+        self._apply_jacobian_implemented = (
+            self._base_model._apply_jacobian_implemented)
+        self._hessian_implemented = self._base_model._hessian_implemented
+        self._apply_hessian_implemented = (
+            self._base_model._apply_hessian_implemented)
+
     @staticmethod
     def _expand_samples_from_indices(reduced_samples, active_var_indices,
                                      inactive_var_indices,
diff --git a/pyapprox/pde/hdg/parameterized_models.py b/pyapprox/pde/hdg/parameterized_models.py
index 597da6d6..b720ce4f 100644
--- a/pyapprox/pde/hdg/parameterized_models.py
+++ b/pyapprox/pde/hdg/parameterized_models.py
@@ -22,7 +22,7 @@
 from skfem.visuals.matplotlib import plot, plt
 from skfem import MeshQuad, Functional
 from pyapprox.pde.galerkin.meshes import init_gappy
-from pyapprox.pde.karhunen_loeve_expansion import MeshKLE
+from pyapprox.pde.kle.torchkle import TorchMeshKLE
 
 
 def full_fun_axis_0(fill_val, xx, oned=True):
@@ -832,7 +832,7 @@ def _init_kle(self, *args):
         self._common_mesh_pts_dict = common_matrix_rows(mesh_pts.T)
         unique_indices = np.array(
             [item[0] for key, item in self._common_mesh_pts_dict.items()])
-        kle = MeshKLE(mesh_pts[:, unique_indices], use_log=True)
+        kle = TorchMeshKLE(mesh_pts[:, unique_indices], use_log=True)
         kle.compute_basis(length_scale, sigma, nterms)
         return kle, mesh_pts
 
diff --git a/pyapprox/pde/kle/__init__.py b/pyapprox/pde/kle/__init__.py
new file mode 100644
index 00000000..4ca5370f
--- /dev/null
+++ b/pyapprox/pde/kle/__init__.py
@@ -0,0 +1,3 @@
+"""The :mod:`pyapprox.pde` module implements numerical methods
+for solving partial differential equations (PDEs).
+"""
diff --git a/pyapprox/pde/karhunen_loeve_expansion.py b/pyapprox/pde/kle/_kle.py
similarity index 89%
rename from pyapprox/pde/karhunen_loeve_expansion.py
rename to pyapprox/pde/kle/_kle.py
index 2744dafe..72fd1072 100644
--- a/pyapprox/pde/karhunen_loeve_expansion.py
+++ b/pyapprox/pde/kle/_kle.py
@@ -294,22 +294,32 @@ def _compute_basis(self):
         """
         K = self._compute_kernel_matrix()
         if self._quad_weights is None:
+            # always compute eigenvalue decomposition using scipy because
+            # it can be used to only compute subset of eigenvectors
+            # then we cast these back to correct linalg type. The downside
+            # is that we cannot use autograd on quantities used to consturct K.
+            # but the need for this is unlikely
             eig_vals, eig_vecs = eigh(
-                K, turbo=False,
+                self._la_to_numpy(K), turbo=False,
                 subset_by_index=(K.shape[0]-self._nterms, K.shape[0]-1))
+            eig_vals = self._la_atleast1d(eig_vals)
+            eig_vecs = self._la_atleast2d(eig_vecs)
         else:
             # see https://etheses.lse.ac.uk/2950/1/U615901.pdf
             # page 42
-            sqrt_weights = np.sqrt(self._quad_weights)
+            sqrt_weights = self._la_sqrt(self._quad_weights)
             sym_eig_vals, sym_eig_vecs = eigh(
-                sqrt_weights[:, None]*K*sqrt_weights, turbo=False,
+                self._la_to_numpy(sqrt_weights[:, None]*K*sqrt_weights),
                 subset_by_index=(K.shape[0]-self._nterms, K.shape[0]-1))
+            sym_eig_vals = self._la_atleast1d(sym_eig_vals)
+            sym_eig_vecs = self._la_atleast2d(sym_eig_vecs)
             eig_vecs = 1/sqrt_weights[:, None]*sym_eig_vecs
             eig_vals = sym_eig_vals
         eig_vecs = adjust_sign_eig(eig_vecs)
-        II = np.argsort(eig_vals)[::-1][:self._nterms]
-        assert np.all(eig_vals[II] > 0), eig_vals[II]
-        self._sqrt_eig_vals = np.sqrt(eig_vals[II])
+        # II = self._la_argsort(eig_vals)[::-1][:self._nterms]
+        II = self._la_flip(self._la_argsort(eig_vals))[:self._nterms]
+        assert self._la_all(eig_vals[II] > 0), eig_vals[II]
+        self._sqrt_eig_vals = self._la_sqrt(eig_vals[II])
         self._eig_vecs = eig_vecs[:, II]
 
     def __call__(self, coef):
@@ -324,8 +334,9 @@ def __call__(self, coef):
         assert coef.ndim == 2
         assert coef.shape[0] == self._nterms
         if self._use_log:
-            return np.exp(self._mean_field[:, None]+self._eig_vecs.dot(coef))
-        return self._mean_field[:, None] + self._eig_vecs.dot(coef)
+            return self._la_exp(
+                self._mean_field[:, None] + self._eig_vecs@coef)
+        return self._mean_field[:, None] + self._eig_vecs@coef
 
     def __repr__(self):
         if self._nterms is None:
@@ -364,7 +375,8 @@ def __init__(self, mesh_coords, length_scale, sigma=1., mean_field=0,
 
     def _set_mean_field(self, mean_field):
         if np.isscalar(mean_field):
-            mean_field = np.ones(self._mesh_coords.shape[1])*mean_field
+            mean_field = self._la_full(
+                (self._mesh_coords.shape[1],), 1)*mean_field
         super()._set_mean_field(mean_field)
 
     def _set_nterms(self, nterms):
@@ -378,21 +390,24 @@ def _set_mesh_coordinates(self, mesh_coords):
         self._mesh_coords = mesh_coords
 
     def _set_lenscale(self, length_scale):
-        length_scale = np.atleast_1d(length_scale)
+        length_scale = self._la_atleast1d(length_scale)
         if length_scale.shape[0] == 1:
-            length_scale = np.full(self._mesh_coords.shape[0], length_scale[0])
+            length_scale = self._la_full(
+                (self._mesh_coords.shape[0],), length_scale[0])
         assert length_scale.shape[0] == self._mesh_coords.shape[0]
         self._lenscale = length_scale
 
     def _compute_kernel_matrix(self):
         if self._matern_nu == np.inf:
-            dists = pdist(self._mesh_coords.T / self._lenscale,
-                          metric='sqeuclidean')
+            dists = pdist(
+                self._la_to_numpy(self._mesh_coords.T / self._lenscale),
+                metric='sqeuclidean')
             K = squareform(np.exp(-.5 * dists))
             np.fill_diagonal(K, 1)
-            return K
+            return self._la_atleast2d(K)
 
-        dists = pdist(self._mesh_coords.T / self._lenscale, metric='euclidean')
+        dists = pdist(self._la_to_numpy(
+            self._mesh_coords.T / self._lenscale), metric='euclidean')
         if self._matern_nu == 0.5:
             K = squareform(np.exp(-dists))
         elif self._matern_nu == 1.5:
@@ -401,7 +416,7 @@ def _compute_kernel_matrix(self):
         elif self._matern_nu == 2.5:
             K = squareform((1+dists+dists**2/3)*np.exp(-dists))
         np.fill_diagonal(K, 1)
-        return K
+        return self._la_atleast2d(K)
 
     def __repr__(self):
         if self._nterms is None:
@@ -412,26 +427,6 @@ def __repr__(self):
             self._lenscale, self._sigma)
 
 
-class TorchKLEWrapper(AbstractKLE):
-    def __init__(self, kle):
-        import torch
-        self._kle = kle
-        for attr in self._kle.__dict__.keys():
-            setattr(self, attr, self._kle.__dict__[attr])
-
-    def __call__(self, coef):
-        import torch
-        return torch.as_tensor(self._kle(coef), dtype=torch.double)
-
-    def __repr__(self):
-        return "TorchWrapper({0})".format(self._kle.__repr__())
-
-    def _compute_kernel_matrix(self):
-        import torch
-        return torch.as_tensor(
-            self.kle._compute_kernel_matrix(), dtype=torch.double)
-
-
 class DataDrivenKLE(AbstractKLE):
     def __init__(self, field_samples, mean_field=0,
                  use_log=False, nterms=None):
@@ -440,7 +435,8 @@ def __init__(self, field_samples, mean_field=0,
 
     def _set_mean_field(self, mean_field):
         if np.isscalar(mean_field):
-            mean_field = np.ones(self._field_samples.shape[0])*mean_field
+            mean_field = self._la_full(
+                (self._field_samples.shape[0],), 1)*mean_field
         super()._set_mean_field(mean_field)
 
     def _set_nterms(self, nterms):
@@ -453,7 +449,7 @@ def _set_mesh_coordinaets(self, mesh_coords):
         self._mesh_coords = None
 
     def _compute_kernel_matrix(self):
-        return np.cov(self._field_samples, rowvar=True, ddof=1)
+        return self._la_cov(self._field_samples, rowvar=True, ddof=1)
 
 
 def multivariate_chain_rule(jac_yu, jac_ux):
diff --git a/pyapprox/pde/kle/numpykle.py b/pyapprox/pde/kle/numpykle.py
new file mode 100644
index 00000000..aa911dea
--- /dev/null
+++ b/pyapprox/pde/kle/numpykle.py
@@ -0,0 +1,10 @@
+from pyapprox.util.linearalgebra.numpylinalg import NumpyLinAlgMixin
+from pyapprox.pde.kle._kle import MeshKLE, DataDrivenKLE
+
+
+class NumpyMeshKLE(MeshKLE, NumpyLinAlgMixin):
+    pass
+
+
+class NumpyDataDrivenKLE(DataDrivenKLE, NumpyLinAlgMixin):
+    pass
diff --git a/pyapprox/pde/kle/torchkle.py b/pyapprox/pde/kle/torchkle.py
new file mode 100644
index 00000000..69712503
--- /dev/null
+++ b/pyapprox/pde/kle/torchkle.py
@@ -0,0 +1,48 @@
+import numpy as np
+
+from pyapprox.util.linearalgebra.torchlinalg import TorchLinAlgMixin
+from pyapprox.pde.kle._kle import MeshKLE, DataDrivenKLE
+
+
+class TorchMeshKLE(MeshKLE, TorchLinAlgMixin):
+    pass
+
+
+class TorchDataDrivenKLE(DataDrivenKLE, TorchLinAlgMixin):
+    pass
+
+
+class TorchInterpolatedMeshKLE(MeshKLE, TorchLinAlgMixin):
+    # TODO make this work for any linalgmix in and move to _kle.py
+    # This requires larger changes to autopde
+    def __init__(self, kle_mesh, kle, mesh):
+        self._kle_mesh = kle_mesh
+        self._kle = kle
+        assert isinstance(self._kle, TorchMeshKLE)
+        self._mesh = mesh
+
+        self.matern_nu = self._kle._matern_nu
+        self.nterms = self._kle._nterms
+        self.lenscale = self._kle._lenscale
+
+        self._basis_mat = self._kle_mesh._get_lagrange_basis_mat(
+            self._kle_mesh._canonical_mesh_pts_1d,
+            mesh._map_samples_to_canonical_domain(self._mesh.mesh_pts))
+
+    def _fast_interpolate(self, values, xx):
+        assert xx.shape[1] == self._mesh.mesh_pts.shape[1]
+        assert np.allclose(xx, self._mesh.mesh_pts)
+        interp_vals = self._la_multidot((self._basis_mat, values))
+        return interp_vals
+
+    def __call__(self, coef):
+        use_log = self._kle._use_log
+        self._kle._use_log = False
+        vals = self._kle(coef)
+        interp_vals = self._fast_interpolate(vals, self._mesh.mesh_pts)
+        mean_field = self._fast_interpolate(
+            self._kle._mean_field[:, None], self._mesh.mesh_pts)
+        if use_log:
+            interp_vals = self._la_exp(mean_field+interp_vals)
+        self._kle._use_log = use_log
+        return interp_vals
diff --git a/pyapprox/pde/tests/test_karhunen_loeve.py b/pyapprox/pde/tests/test_karhunen_loeve.py
index 6f792c9c..4a55f648 100644
--- a/pyapprox/pde/tests/test_karhunen_loeve.py
+++ b/pyapprox/pde/tests/test_karhunen_loeve.py
@@ -2,9 +2,14 @@
 
 import numpy as np
 
-from pyapprox.pde.karhunen_loeve_expansion import (
-    multivariate_chain_rule, MeshKLE, compute_kle_gradient_from_mesh_gradient,
-    KLE1D, DataDrivenKLE)
+from pyapprox.pde.kle._kle import (
+    multivariate_chain_rule, compute_kle_gradient_from_mesh_gradient, KLE1D)
+
+from pyapprox.util.linearalgebra.numpylinalg import NumpyLinAlgMixin
+from pyapprox.pde.kle.numpykle import NumpyMeshKLE, NumpyDataDrivenKLE
+
+from pyapprox.util.linearalgebra.torchlinalg import TorchLinAlgMixin
+from pyapprox.pde.kle.torchkle import TorchMeshKLE, TorchDataDrivenKLE
 from pyapprox.util.utilities import approx_jacobian
 
 
@@ -56,7 +61,7 @@ def test_compute_kle_gradient_from_mesh_gradient(self):
         kle_mean = mesh[0, :]+2
 
         for use_log in [False, True]:
-            kle = MeshKLE(
+            kle = NumpyMeshKLE(
                 mesh, length_scale, mean_field=kle_mean, use_log=use_log,
                 sigma=sigma, nterms=nvars)
 
@@ -97,8 +102,8 @@ def test_mesh_kle_1D(self):
         mesh_coords = (mesh_coords+1)/2*dom_len+lb
         quad_weights *= (ub-lb)/2
         mesh_coords = mesh_coords[None, :]
-        kle = MeshKLE(mesh_coords, len_scale, sigma=sigma, nterms=nterms,
-                      matern_nu=0.5, quad_weights=quad_weights)
+        kle = NumpyMeshKLE(mesh_coords, len_scale, sigma=sigma, nterms=nterms,
+                           matern_nu=0.5, quad_weights=quad_weights)
 
         opts = {"mean_field": 0, "sigma2": sigma, "corr_len": len_scale,
                 "num_vars": int(kle._nterms), "use_log": False,
@@ -149,7 +154,7 @@ def trapezoid_rule(level):
         mesh_coords = (mesh_coords+1)/2*dom_len+lb
         quad_weights *= (ub-lb)/2
         mesh_coords = mesh_coords[None, :]
-        kle = MeshKLE(
+        kle = NumpyMeshKLE(
             mesh_coords, len_scale, sigma=sigma, nterms=nterms,
             matern_nu=0.5, quad_weights=quad_weights)
 
@@ -163,7 +168,7 @@ def trapezoid_rule(level):
         quad_weights1 *= (ub1-lb1)/2
         mesh_coords1 = mesh_coords1[None, :]
 
-        kle1 = MeshKLE(
+        kle1 = NumpyMeshKLE(
             mesh_coords1, len_scale, sigma=sigma, nterms=nterms,
             matern_nu=0.5, quad_weights=quad_weights1)
 
@@ -208,7 +213,7 @@ def trapezoid_rule(level):
         quad_weights *= (ub-lb)/2
         mesh_coords = mesh_coords[None, :]
         quad_weights = None
-        kle = MeshKLE(mesh_coords, len_scale, sigma=sigma, nterms=nterms,
+        kle = NumpyMeshKLE(mesh_coords, len_scale, sigma=sigma, nterms=nterms,
                       matern_nu=0.5, quad_weights=quad_weights)
 
         # quad_rule = clenshaw_curtis_pts_wts_1D
@@ -237,7 +242,7 @@ def trapezoid_rule(level):
         # assert np.allclose(mesh_coords, mesh_coords_mix)
         # assert np.allclose(quad_weights, quad_weights_mix)
 
-        kle_mix = MeshKLE(
+        kle_mix = NumpyMeshKLE(
             mesh_coords_mix, len_scale, sigma=sigma, nterms=nterms,
             matern_nu=0.5, quad_weights=quad_weights_mix)
 
@@ -253,13 +258,15 @@ def trapezoid_rule(level):
         # plt.plot(mesh_coords_mix[0, :], eig_vecs_mix, 'r--s')
         # plt.show()
 
-    def test_data_driven_kle(self):
+    def _check_data_driven_kle(self, MeshKLE, DataDrivenKLE, la):
         level = 10
         nterms = 3
         len_scale, sigma = 1, 1
         from pyapprox.surrogates.orthopoly.quadrature import (
             clenshaw_curtis_pts_wts_1D)
         mesh_coords, quad_weights = clenshaw_curtis_pts_wts_1D(level)
+        mesh_coords = la._la_atleast1d(mesh_coords)
+        quad_weights = la._la_atleast1d(quad_weights)
         quad_weights *= 2   # remove pdf of uniform variable
         # map to [lb, ub]
         lb, ub = 0, 2
@@ -272,13 +279,20 @@ def test_data_driven_kle(self):
                       matern_nu=0.5, quad_weights=quad_weights)
 
         nsamples = 10000
-        samples = np.random.normal(0., 1., (nterms, nsamples))
+        samples = la._la_atleast2d(
+            np.random.normal(0., 1., (nterms, nsamples)))
         kle_realizations = kle(samples)
 
         # TODO: pass in optiional quadrature weights
         kle_data = DataDrivenKLE(kle_realizations, nterms=nterms)
         print(kle_data._sqrt_eig_vals, kle._sqrt_eig_vals)
 
+    def test_data_driven_kle(self):
+        test_cases = [[NumpyMeshKLE, NumpyDataDrivenKLE, NumpyLinAlgMixin()],
+                      [TorchMeshKLE, TorchDataDrivenKLE, TorchLinAlgMixin()]]
+        for case in test_cases:
+            self._check_data_driven_kle(*case)
+
 
 if __name__ == "__main__":
     kle_test_suite = unittest.TestLoader().loadTestsFromTestCase(
diff --git a/pyapprox/surrogates/autogp/tests/test_mokernels.py b/pyapprox/surrogates/autogp/tests/test_mokernels.py
index 074e4e74..de61f099 100644
--- a/pyapprox/surrogates/autogp/tests/test_mokernels.py
+++ b/pyapprox/surrogates/autogp/tests/test_mokernels.py
@@ -331,7 +331,7 @@ def _check_block_cholesky(self, MaternKernel, Monomial):
         L_true = np.linalg.cholesky(kmat)
 
         blocks = kernel(samples_per_output, block_format=True)
-        L = kernel._cholesky(noutputs, blocks, block_format=False)
+        L = kernel._cholesky(noutputs, blocks, block_format=False, la=kernel)
         assert np.allclose(L, L_true)
 
         L_blocks = kernel._cholesky(noutputs, blocks, block_format=True)
diff --git a/pyapprox/util/linearalgebra/linalgbase.py b/pyapprox/util/linearalgebra/linalgbase.py
index 9843e074..eddabeea 100644
--- a/pyapprox/util/linearalgebra/linalgbase.py
+++ b/pyapprox/util/linearalgebra/linalgbase.py
@@ -193,7 +193,12 @@ def _la_norm(self, mat, axis=None):
 
     @abstractmethod
     def _la_any(self, mat, axis=None):
-        """Find which elements of a matrix evaluates to True."""
+        """Find if any element of a matrix evaluates to True."""
+        raise NotImplementedError
+
+    @abstractmethod
+    def _la_all(self, mat, axis=None):
+        """Find if all elements of a matrix evaluate to True."""
         raise NotImplementedError
 
     @abstractmethod
@@ -223,6 +228,26 @@ def _la_abs(self, mat):
         """Compute the absolte values of each entry in a matrix"""
         raise NotImplementedError
 
+    def _la_to_numpy(self, mat):
+        """Compute the matrix to a np.ndarray."""
+        raise NotImplementedError
+
+    def _la_argsort(self, mat, axis=-1):
+        """Compute the indices that sort a matrix in ascending order."""
+        raise NotImplementedError
+
+    def _la_sort(self, mat, axis=-1):
+        """Return the matrix sorted in ascending order."""
+        raise NotImplementedError
+
+    def _la_flip(self, mat, axis=None):
+        "Reverse the order of the elements in a matrix."
+        raise NotImplementedError
+
+    def _la_allclose(self, Amat, Bmat, **kwargs):
+        "Check if two matries are close"
+        raise NotImplementedError
+
     def _la_detach(self, mat):
         """Detach a matrix from the computational graph.
         Override for backends that support automatic differentiation."""
diff --git a/pyapprox/util/linearalgebra/numpylinalg.py b/pyapprox/util/linearalgebra/numpylinalg.py
index 4974f4fc..6f075a1b 100644
--- a/pyapprox/util/linearalgebra/numpylinalg.py
+++ b/pyapprox/util/linearalgebra/numpylinalg.py
@@ -120,6 +120,9 @@ def _la_norm(self, mat: np.ndarray, axis=None) -> np.ndarray:
     def _la_any(self, mat: np.ndarray, axis=None) -> np.ndarray:
         return np.any(mat, axis=axis)
 
+    def _la_all(self, mat: np.ndarray, axis=None) -> np.ndarray:
+        return np.all(mat, axis=axis)
+
     def _la_kron(self, Amat: np.ndarray, Bmat: np.ndarray) -> np.ndarray:
         return np.kron(Amat, Bmat)
 
@@ -138,3 +141,19 @@ def _la_cov(self, mat: np.ndarray, ddof=0, rowvar=True) -> np.ndarray:
 
     def _la_abs(self, mat: np.ndarray) -> np.ndarray:
         return np.absolute(mat)
+
+    def _la_to_numpy(self, mat: np.ndarray) -> np.ndarray:
+        return mat
+
+    def _la_argsort(self, mat: np.ndarray, axis=-1) -> np.ndarray:
+        return np.argsort(mat, axis=axis)
+
+    def _la_sort(self, mat: np.ndarray, axis=-1) -> np.ndarray:
+        return np.sort(mat, axis=axis)
+
+    def _la_flip(self, mat, axis=None):
+        return np.flip(mat, axis=axis)
+
+    def _la_allclose(self, Amat: np.ndarray, Bmat: np.ndarray,
+                     **kwargs) -> bool:
+        return np.allclose(Amat, Bmat, **kwargs)
diff --git a/pyapprox/util/linearalgebra/torchlinalg.py b/pyapprox/util/linearalgebra/torchlinalg.py
index 5b02376b..fc592005 100644
--- a/pyapprox/util/linearalgebra/torchlinalg.py
+++ b/pyapprox/util/linearalgebra/torchlinalg.py
@@ -127,6 +127,11 @@ def _la_any(self, mat: torch.Tensor, axis=None) -> torch.Tensor:
             return torch.any(mat)
         return torch.any(mat, dim=axis)
 
+    def _la_all(self, mat: torch.Tensor, axis=None) -> torch.Tensor:
+        if axis is None:
+            return torch.all(mat)
+        return torch.all(mat, dim=axis)
+
     def _la_kron(self, Amat: torch.Tensor, Bmat: torch.Tensor) -> torch.Tensor:
         return torch.kron(Amat, Bmat)
 
@@ -151,3 +156,21 @@ def _la_cov(self, mat: torch.Tensor, ddof=0, rowvar=True) -> torch.Tensor:
 
     def _la_abs(self, mat: torch.Tensor) -> torch.Tensor:
         return torch.absolute(mat)
+
+    def _la_to_numpy(self, mat: torch.Tensor):
+        return mat.numpy()
+
+    def _la_argsort(self, mat: torch.Tensor, axis=-1) -> torch.Tensor:
+        return torch.argsort(mat, dim=axis)
+
+    def _la_sort(self, mat: torch.Tensor, axis=-1) -> torch.Tensor:
+        return torch.sort(mat, dim=axis)
+
+    def _la_flip(self, mat: torch.Tensor, axis=None) -> torch.Tensor:
+        if axis is None:
+            axis = (0,)
+        return torch.flip(mat, dims=axis)
+
+    def _la_allclose(self, Amat: torch.Tensor, Bmat: torch.Tensor,
+                     **kwargs) -> bool:
+        return torch.allclose(Amat, Bmat, **kwargs)

From 3505920d134e27f78f61b7845da5bed24ec61e89 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Thu, 23 May 2024 09:57:05 -0600
Subject: [PATCH 06/15] Fix a few small bugs picked up by CI that I am not sure
 exactly were introduced

---
 pyapprox/interface/model.py                  |  3 ++-
 pyapprox/interface/tests/test_model.py       | 21 +++++--------------
 pyapprox/multifidelity/acv.py                |  2 +-
 pyapprox/optimization/tests/test_minimize.py |  2 +-
 pyapprox/pde/time_integration.py             |  5 ++++-
 pyapprox/surrogates/interp/tensorprod.py     | 22 +++++++++++++-------
 6 files changed, 27 insertions(+), 28 deletions(-)

diff --git a/pyapprox/interface/model.py b/pyapprox/interface/model.py
index 5a6cb149..35bd317f 100644
--- a/pyapprox/interface/model.py
+++ b/pyapprox/interface/model.py
@@ -293,7 +293,8 @@ def __call__(self, samples):
 
 class ModelFromCallable(SingleSampleModel):
     def __init__(self, function, jacobian=None, apply_jacobian=None,
-                 apply_hessian=None, hessian=None, sample_ndim=2, values_ndim=2):
+                 apply_hessian=None, hessian=None, sample_ndim=2,
+                 values_ndim=2):
         """
         Parameters
         ----------
diff --git a/pyapprox/interface/tests/test_model.py b/pyapprox/interface/tests/test_model.py
index 183ecfcb..af991d8a 100644
--- a/pyapprox/interface/tests/test_model.py
+++ b/pyapprox/interface/tests/test_model.py
@@ -30,9 +30,9 @@ def test_scalar_model_from_callable_2D_sample(self):
         model = ModelFromCallable(
             lambda sample: self._evaluate_sp_lambda(
                 sp.lambdify(symbs, sp_fun, "numpy"), sample),
-            lambda sample, vec: self._evaluate_sp_lambda(
+            apply_jacobian=lambda sample, vec: self._evaluate_sp_lambda(
                 sp.lambdify(symbs, sp_grad, "numpy"), sample) @ vec,
-            lambda sample, vec: self._evaluate_sp_lambda(
+            apply_hessian=lambda sample, vec: self._evaluate_sp_lambda(
                 sp.lambdify(symbs, sp_hessian), sample) @ vec)
         sample = np.random.uniform(0, 1, (nvars, 1))
         model.check_apply_jacobian(sample, disp=True)
@@ -72,8 +72,6 @@ def test_scalar_model_from_callable_1D_sample(self):
         errors = model.check_apply_hessian(sample)
         assert errors[0] < 1e-15
 
-        
-
     def test_vector_model_from_callable(self):
         symbs = sp.symbols(["x", "y", "z"])
         nvars = len(symbs)
@@ -83,7 +81,7 @@ def test_vector_model_from_callable(self):
         model = ModelFromCallable(
             lambda sample: self._evaluate_sp_lambda(
                 sp.lambdify(symbs, sp_fun, "numpy"), sample),
-            lambda sample, vec: self._evaluate_sp_lambda(
+            apply_jacobian=lambda sample, vec: self._evaluate_sp_lambda(
                 sp.lambdify(symbs, sp_grad, "numpy"), sample) @ vec)
         sample = np.random.uniform(0, 1, (nvars, 1))
         model.check_apply_jacobian(sample, disp=True)
@@ -102,9 +100,9 @@ def test_scipy_wrapper(self):
         model = ModelFromCallable(
             lambda sample: self._evaluate_sp_lambda(
                 sp.lambdify(symbs, sp_fun, "numpy"), sample),
-            lambda sample, vec: self._evaluate_sp_lambda(
+            apply_jacobian=lambda sample, vec: self._evaluate_sp_lambda(
                 sp.lambdify(symbs, sp_grad, "numpy"), sample) @ vec,
-            lambda sample, vec: self._evaluate_sp_lambda(
+            apply_hessian=lambda sample, vec: self._evaluate_sp_lambda(
                 sp.lambdify(symbs, sp_hessian), sample) @ vec)
         scipy_model = ScipyModelWrapper(model)
         # check scipy model works with 1D sample array
@@ -115,15 +113,6 @@ def test_scipy_wrapper(self):
         assert np.allclose(scipy_model.hess(sample), self._evaluate_sp_lambda(
                sp.lambdify(symbs, sp_hessian, "numpy"), sample[:, None]))
 
-        # test error is thrown if scipy model does not return a scalar output
-        sp_fun = [sum([s*(ii+1) for ii, s in enumerate(symbs)])**4,
-                  sum([s*(ii+1) for ii, s in enumerate(symbs)])**5]
-        model = ModelFromCallable(
-            lambda sample: self._evaluate_sp_lambda(
-                sp.lambdify(symbs, sp_fun, "numpy"), sample))
-        scipy_model = ScipyModelWrapper(model)
-        self.assertRaises(ValueError, scipy_model, sample)
-
     def test_umbridge_model(self):
         server_dir = os.path.dirname(__file__)
         url = 'http://localhost:4242'
diff --git a/pyapprox/multifidelity/acv.py b/pyapprox/multifidelity/acv.py
index 27a88c72..d82c7a50 100644
--- a/pyapprox/multifidelity/acv.py
+++ b/pyapprox/multifidelity/acv.py
@@ -615,7 +615,7 @@ def bootstrap(self, values_per_model, nbootstraps=1000,
                 CF, cf = self._get_discrepancy_covariances(
                     self._rounded_npartition_samples)
                 weights = self._weights(CF, cf)
-                weights_list.append(weights.flatten())
+                weights_list.append(weights.flatten().numpy())
             else:
                 weights = self._optimized_weights
             estimator_vals.append(self._estimate(
diff --git a/pyapprox/optimization/tests/test_minimize.py b/pyapprox/optimization/tests/test_minimize.py
index 1d0a2717..85220e26 100644
--- a/pyapprox/optimization/tests/test_minimize.py
+++ b/pyapprox/optimization/tests/test_minimize.py
@@ -218,7 +218,7 @@ def _jacobian(self, x):
         basis = UnivariatePiecewiseQuadraticBasis()
         nodes = np.linspace(*stats.norm(0, 1).interval(1-1e-6), nsamples)
         print(nodes)
-        weights = basis.quadrature_weights(nodes)
+        weights = basis._quadrature_rule_from_nodes(nodes[None, :])[1][:, 0]
         weights = (weights*stats.norm(0, 1).pdf(nodes))[:, None]
         samples = np.vstack([nodes[None, :], nodes[None, :]*sigma2+mu2])
         stat = SampleAverageConditionalValueAtRisk([0.5, 0.85], eps=1e-3)
diff --git a/pyapprox/pde/time_integration.py b/pyapprox/pde/time_integration.py
index a0122c8f..40ad0fd8 100644
--- a/pyapprox/pde/time_integration.py
+++ b/pyapprox/pde/time_integration.py
@@ -164,7 +164,10 @@ def __call__(self, prev_sol, prev_time, deltat):
         raise NotImplementedError
 
     def integrate(self, times, sols):
-        return self._basis.integrate(times, sols)
+        self._basis.set_nodes(times[None, :])
+        quad_weights = self._basis.quadrature_rule()[1]
+        active_indices = self._basis._active_node_indices_for_quadrature()
+        return (quad_weights*sols[active_indices].sum(axis=0))
 
 
 class ImplicitTimeIntegratorUpdate(TimeIntegratorUpdate):
diff --git a/pyapprox/surrogates/interp/tensorprod.py b/pyapprox/surrogates/interp/tensorprod.py
index bc5b8e8d..899ca134 100644
--- a/pyapprox/surrogates/interp/tensorprod.py
+++ b/pyapprox/surrogates/interp/tensorprod.py
@@ -446,12 +446,6 @@ def quadrature_rule(self):
         self._check_samples(samples)
         return samples, weights
 
-    def integrate(self, vals):
-        weights = self.quadrature_rule()[1]
-        if vals.ndim != 2 or vals.ndim != weights.shape[0]:
-            raise ValueError("vals and weights are inconsistent")
-        return (weights[:, None]*vals).sum()
-
     @abstractmethod
     def nterms(self):
         raise NotImplementedError
@@ -471,11 +465,11 @@ def set_nodes(self, nodes):
         self._nodes = nodes
 
     @abstractmethod
-    def _evaluate_from_nodes(self):
+    def _evaluate_from_nodes(self, nodes):
         raise NotImplementedError
 
     @abstractmethod
-    def _quadrature_rule_from_nodes(self):
+    def _quadrature_rule_from_nodes(self, nodes):
         raise NotImplementedError
 
     def _evaluate(self, samples):
@@ -495,6 +489,9 @@ def __repr__(self):
         return "{0}(nnodes={1})".format(
             self.__class__.__name__, self.nterms())
 
+    def _active_node_indices_for_quadrature(self):
+        return np.arange(self.nterms())
+
 
 class UnivariatePiecewiseLeftConstantBasis(UnivariateInterpolatingBasis):
     @staticmethod
@@ -508,6 +505,9 @@ def _quadrature_rule_from_nodes(nodes):
     def nterms(self):
         return self._nodes.shape[1]-1
 
+    def _active_node_indices_for_quadrature(self):
+        return np.arange(self.nterms()-1)
+
 
 class UnivariatePiecewiseRightConstantBasis(UnivariateInterpolatingBasis):
     @staticmethod
@@ -522,6 +522,9 @@ def _quadrature_rule_from_nodes(nodes):
     def nterms(self):
         return self._nodes.shape[1]-1
 
+    def _active_node_indices_for_quadrature(self):
+        return np.arange(1, self.nterms())
+
 
 class UnivariatePiecewiseMidPointConstantBasis(UnivariateInterpolatingBasis):
     @staticmethod
@@ -536,6 +539,9 @@ def _quadrature_rule_from_nodes(nodes):
     def nterms(self):
         return self._nodes.shape[1]-1
 
+    def _active_node_indices_for_quadrature(self):
+        raise ValueError("Quadrature points do not coincide with nodes")
+
 
 class UnivariatePiecewiseLinearBasis(UnivariateInterpolatingBasis):
     @staticmethod

From 105beb903cc5764f6073c0af230bd6bba7919f07 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Thu, 23 May 2024 10:44:58 -0600
Subject: [PATCH 07/15] Try to remove need for latex when running
 plot_bayesian_oed.py

---
 tutorials/expdesign/plot_bayesian_oed.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/tutorials/expdesign/plot_bayesian_oed.py b/tutorials/expdesign/plot_bayesian_oed.py
index bd5f388c..31ff856d 100644
--- a/tutorials/expdesign/plot_bayesian_oed.py
+++ b/tutorials/expdesign/plot_bayesian_oed.py
@@ -291,6 +291,7 @@ def plot_posteriors(
 cvar_p2 = 0.2
 data_markers = ["X", "s", "o"]
 data_latex_markers = [r"\times", r"\square", r"\circ"]
+data_latex_markers = [r"A", r"B", r"C"]
 joint_prior_noise_variable = IndependentMarginalsVariable(
     prior_rvs + [noise_rv])
 if prior_variable.num_vars() == 1:

From 4632b4fda8c4675b6c9d30a04dfdcfce60cd83d1 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Thu, 23 May 2024 12:57:24 -0600
Subject: [PATCH 08/15] Fix issues in tutorial scripts.

Change scaling in optimization used in plot_multioutput_acv.py

Update plot_bayesian_oed.py to use new interpolant interface
---
 .../continuous-integration-workflow-conda.yml       |  8 +++++---
 .../continuous-integration-workflow-docs.yml        |  8 +++++---
 .../continuous-integration-workflow-pip.yml         |  8 +++++---
 pyapprox/benchmarks/tests/test_pde_benchmarks.py    |  2 +-
 pyapprox/optimization/tests/test_minimize.py        |  6 +++---
 pyapprox/surrogates/autogp/tests/test_mokernels.py  | 13 +++++++------
 tutorials/expdesign/plot_bayesian_oed.py            |  8 +++-----
 tutorials/multi_fidelity/plot_multioutput_acv.py    |  2 +-
 8 files changed, 30 insertions(+), 25 deletions(-)

diff --git a/.github/workflows/continuous-integration-workflow-conda.yml b/.github/workflows/continuous-integration-workflow-conda.yml
index 0b135695..e822cca5 100644
--- a/.github/workflows/continuous-integration-workflow-conda.yml
+++ b/.github/workflows/continuous-integration-workflow-conda.yml
@@ -1,9 +1,11 @@
 name: Build and Test Using Conda
 
 on:
-  push:
-    # branches: [master, devel]
-    branches: [master]
+  # push:
+  # branches: [master, devel]
+  # branches: [master]
+  pull_request:
+    branches: [devel]
 
   workflow_dispatch:
 
diff --git a/.github/workflows/continuous-integration-workflow-docs.yml b/.github/workflows/continuous-integration-workflow-docs.yml
index d0dfec09..492dcc2d 100644
--- a/.github/workflows/continuous-integration-workflow-docs.yml
+++ b/.github/workflows/continuous-integration-workflow-docs.yml
@@ -1,9 +1,11 @@
 name: Build Docs Using Conda
 
 on:
-  push:
-    branches: [master]
-    # branches: [master, devel]
+  # push:
+  # branches: [master]
+  # branches: [master, devel]
+  pull_request:
+    branches: [devel]
 
   workflow_dispatch:
 
diff --git a/.github/workflows/continuous-integration-workflow-pip.yml b/.github/workflows/continuous-integration-workflow-pip.yml
index c7c92543..c1d12651 100644
--- a/.github/workflows/continuous-integration-workflow-pip.yml
+++ b/.github/workflows/continuous-integration-workflow-pip.yml
@@ -1,9 +1,11 @@
 name: Build and Test Using Pip
 
 on:
-  push:
-    # branches: [master, devel]
-    branches: [master]
+  #push:
+  # branches: [master, devel]
+  # branches: [master]
+  pull_request:
+    branches: [devel]  
 
   workflow_dispatch:
 
diff --git a/pyapprox/benchmarks/tests/test_pde_benchmarks.py b/pyapprox/benchmarks/tests/test_pde_benchmarks.py
index 9bdfc7a8..e4e88aaf 100644
--- a/pyapprox/benchmarks/tests/test_pde_benchmarks.py
+++ b/pyapprox/benchmarks/tests/test_pde_benchmarks.py
@@ -259,7 +259,7 @@ def test_setup_transient_multi_index_advection_diffusion_benchmark(self):
         # plt.loglog(
         #     ndof[:-1], np.abs((qoi_means[-1]-qoi_means[:-1])/qoi_means[-1]))
         # plt.show()
-        assert (rel_diffs.max() > 4e-2 and rel_diffs.min() < 9.5e-5)
+        assert (rel_diffs.max() > 4e-2 and rel_diffs.min() < 1e-4)
 
 
 if __name__ == "__main__":
diff --git a/pyapprox/optimization/tests/test_minimize.py b/pyapprox/optimization/tests/test_minimize.py
index 85220e26..47cfb966 100644
--- a/pyapprox/optimization/tests/test_minimize.py
+++ b/pyapprox/optimization/tests/test_minimize.py
@@ -206,7 +206,7 @@ def _jacobian(self, x):
         weights = np.full((nsamples, 1), 1/nsamples)
         # from pyapprox.surrogates.orthopoly.quadrature import (
         #     gauss_hermite_pts_wts_1D)
-        
+
         # nsamples = 1000
         # samples = np.vstack(
         #     [gauss_hermite_pts_wts_1D(nsamples)[0],
@@ -254,7 +254,7 @@ def _jacobian(self, x):
             np.full((ndesign_vars+nconstraints,), np.inf))
         optimizer = ScipyConstrainedOptimizer(
             objective, bounds=bounds, constraints=[constraint],
-            opts={"gtol": 1e-6, "verbose": 3, "maxiter": 200})
+            opts={"gtol": 1e-6, "verbose": 3, "maxiter": 500})
         result = optimizer.minimize(opt_x0)
 
         # errors in sample based estimate of CVaR will cause
@@ -264,7 +264,7 @@ def _jacobian(self, x):
         # print(constraint(exact_opt_x), [CVaR1, CVaR2])
         # print(result.x-exact_opt_x[:, 0], exact_opt_x[:, 0])
         assert np.allclose(result.x, exact_opt_x[:, 0], rtol=1e-3, atol=1e-6)
-        assert np.allclose(-sigma1, result.fun, rtol=1e-5)
+        assert np.allclose(-sigma1, result.fun, rtol=1e-4)
 
 
 if __name__ == '__main__':
diff --git a/pyapprox/surrogates/autogp/tests/test_mokernels.py b/pyapprox/surrogates/autogp/tests/test_mokernels.py
index de61f099..9704183e 100644
--- a/pyapprox/surrogates/autogp/tests/test_mokernels.py
+++ b/pyapprox/surrogates/autogp/tests/test_mokernels.py
@@ -334,20 +334,21 @@ def _check_block_cholesky(self, MaternKernel, Monomial):
         L = kernel._cholesky(noutputs, blocks, block_format=False, la=kernel)
         assert np.allclose(L, L_true)
 
-        L_blocks = kernel._cholesky(noutputs, blocks, block_format=True)
-        L = kernel._cholesky_blocks_to_dense(*L_blocks)
+        L_blocks = kernel._cholesky(
+            noutputs, blocks, block_format=True, la=kernel)
+        L = kernel._cholesky_blocks_to_dense(*L_blocks, la=kernel)
         assert np.allclose(L, L_true)
         assert np.allclose(
-            kernel._logdet(*L_blocks), np.linalg.slogdet(kmat)[1])
+            kernel._logdet(*L_blocks, la=kernel), np.linalg.slogdet(kmat)[1])
         values = np.random.normal(0, 1, (L.shape[1], 1))
         assert np.allclose(
-            kernel._lower_solve_triangular(*L_blocks, values),
+            kernel._lower_solve_triangular(*L_blocks, values, la=kernel),
             scipy.linalg.solve_triangular(L, values, lower=True))
         assert np.allclose(
-            kernel._upper_solve_triangular(*L_blocks, values),
+            kernel._upper_solve_triangular(*L_blocks, values, la=kernel),
             scipy.linalg.solve_triangular(L.T, values, lower=False))
         assert np.allclose(
-            kernel._cholesky_solve(*L_blocks, values),
+            kernel._cholesky_solve(*L_blocks, values, la=kernel),
             np.linalg.inv(kmat) @ values)
 
     def test_block_cholesky(self):
diff --git a/tutorials/expdesign/plot_bayesian_oed.py b/tutorials/expdesign/plot_bayesian_oed.py
index 31ff856d..59a2e1f0 100644
--- a/tutorials/expdesign/plot_bayesian_oed.py
+++ b/tutorials/expdesign/plot_bayesian_oed.py
@@ -596,8 +596,8 @@ def compute_deviations(design_pt, prior_noise_quad_data, noise_std, xx, ww,
 def interpolate_deviation(nsamples_1d, basis_type, quad_data, deviations,
                           samples):
     # assumes same samples for each dimension
-    abscissa_1d = [quad_data[0][0, :nsamples_1d[0]],
-                   quad_data[0][1, ::nsamples_1d[0]]]
+    abscissa_1d = [quad_data[0][:1, :nsamples_1d[0]],
+                   quad_data[0][1:2, ::nsamples_1d[0]]]
     assert deviations.ndim == 1
     interp = TensorProductInterpolant(
         [get_univariate_interpolation_basis(basis_type) for ii in range(2)])
@@ -830,6 +830,7 @@ def plot_risk_prediction_deviation_surface(
     xx = np.linspace(pred_pts[0, 0], pred_pts[0, -1], 101)[None, :]
     interp = TensorProductInterpolant(
         [get_univariate_interpolation_basis(basis_type)])
+    pred_pts = [p[None, :] for p in pred_pts]
     interp.fit(pred_pts, expected_deviations)
     vals = interp(xx)
     ax.plot(xx[0], vals)
@@ -842,7 +843,6 @@ def plot_risk_prediction_deviation_surface(
         prior_noise_quad_data, deviations[ii, ..., dev_idx],
         joint_qmc_xx, joint_qmc_ww, deviation_symbs[dev_idx], design_symbs[ii],
         axs[ii], basis_type, nsamples_1d, pred_wts, pred_pts)
-plt.show()
 
 
 #%%
@@ -890,5 +890,3 @@ def plot_risk_prediction_deviation_pdf(
 axs_kl_pred_pdf.set_xlabel(mathrm_label("Divergence") + r" $\phi$")
 if savefigs:
     fig_kl_pred_pdf.savefig("oed-workflow-kl-pred-div-pdfs.pdf")
-
-plt.show()
diff --git a/tutorials/multi_fidelity/plot_multioutput_acv.py b/tutorials/multi_fidelity/plot_multioutput_acv.py
index 503de64d..91c934dd 100644
--- a/tutorials/multi_fidelity/plot_multioutput_acv.py
+++ b/tutorials/multi_fidelity/plot_multioutput_acv.py
@@ -32,7 +32,7 @@
 stat = mf.multioutput_stats["mean"](benchmark.nqoi)
 stat.set_pilot_quantities(cov)
 est = mf.get_estimator("gmf", stat, costs)
-est.allocate_samples(target_cost)
+est.allocate_samples(target_cost, {"scaling": 1.})
 
 # get covariance of just first qoi
 qoi_idx = [0]

From dad5deec203b5d89fbb786b09a98ffe50f6b7c3a Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Thu, 23 May 2024 13:09:44 -0600
Subject: [PATCH 09/15] Try to fix tolerances to account for across platform
 differences

---
 pyapprox/expdesign/linear_oed.py                             | 1 +
 pyapprox/expdesign/tests/test_linear_oed.py                  | 2 +-
 pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py | 3 ++-
 pyapprox/optimization/tests/test_l1_minimization.py          | 2 +-
 4 files changed, 5 insertions(+), 3 deletions(-)

diff --git a/pyapprox/expdesign/linear_oed.py b/pyapprox/expdesign/linear_oed.py
index d72f8e9c..4a68e91d 100644
--- a/pyapprox/expdesign/linear_oed.py
+++ b/pyapprox/expdesign/linear_oed.py
@@ -470,6 +470,7 @@ def doptimality_criterion(homog_outer_prods, design_factors,
     M0, M1 = get_M0_and_M1_matrices(
         homog_outer_prods, design_prob_measure, noise_multiplier,
         regression_type)
+    print(M1, "#!@, M1", np.linalg.cond(M1))
     M1_inv = np.linalg.inv(M1)
     if noise_multiplier is not None:
         gamma = M0.dot(M1_inv)
diff --git a/pyapprox/expdesign/tests/test_linear_oed.py b/pyapprox/expdesign/tests/test_linear_oed.py
index 0ea2369d..3791c2fd 100644
--- a/pyapprox/expdesign/tests/test_linear_oed.py
+++ b/pyapprox/expdesign/tests/test_linear_oed.py
@@ -1047,7 +1047,7 @@ def test_michaelis_menten_model_minimax_d_optimal_least_squares_design(
         opt_problem = NonLinearAlphabetOptimalDesign('D', local_design_factors)
         mu = opt_problem.solve_nonlinear_minimax(
             parameter_samples, design_samples[np.newaxis, :],
-            {'iprint': 1, 'ftol': 1e-8})
+            {'iprint': 1, 'ftol': 1e-6, 'disp': True})
         II = np.where(mu > 1e-5)[0]
         # given largest theta_2=1 then optimal design will be at 1/3,1
         # with masses=0.5
diff --git a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
index ff7f93e0..4c167a70 100644
--- a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
+++ b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
@@ -495,7 +495,8 @@ def test_best_model_subset_estimator(self):
         target_cost = 10
         est._save_candidate_estimators = True
         np.set_printoptions(linewidth=1000)
-        est.allocate_samples(target_cost, {"verbosity": 1, "nprocs": 1})
+        est.allocate_samples(
+            target_cost, {"verbosity": 1, "nprocs": 1, "scaling": 1.})
 
         criteria = np.array(
             [e[0]._optimized_criteria for e in est._candidate_estimators])
diff --git a/pyapprox/optimization/tests/test_l1_minimization.py b/pyapprox/optimization/tests/test_l1_minimization.py
index e2fa2920..0c2be2f0 100644
--- a/pyapprox/optimization/tests/test_l1_minimization.py
+++ b/pyapprox/optimization/tests/test_l1_minimization.py
@@ -308,7 +308,7 @@ def hess(x):
         coef = res.x
 
         print(np.linalg.norm(true_coef-coef))
-        assert np.allclose(true_coef, coef, atol=6e-3)
+        assert np.allclose(true_coef, coef, atol=7e-3)
 
     @unittest.skip(reason="test incomplete")
     def test_lasso(self):

From af48732c17cede92029fe97ae93d1fd5a0be5f00 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Thu, 23 May 2024 18:53:09 -0600
Subject: [PATCH 10/15] Try to fix test tolerances to account for cross
 platform differences

---
 pyapprox/expdesign/linear_oed.py                          | 1 -
 pyapprox/expdesign/tests/test_linear_oed.py               | 2 +-
 .../multifidelity/tests/test_multioutput_monte_carlo.py   | 8 ++++++--
 pyapprox/optimization/tests/test_minimize.py              | 7 +++++--
 tutorials/multi_fidelity/plot_multioutput_acv.py          | 5 ++++-
 5 files changed, 16 insertions(+), 7 deletions(-)

diff --git a/pyapprox/expdesign/linear_oed.py b/pyapprox/expdesign/linear_oed.py
index 4a68e91d..d72f8e9c 100644
--- a/pyapprox/expdesign/linear_oed.py
+++ b/pyapprox/expdesign/linear_oed.py
@@ -470,7 +470,6 @@ def doptimality_criterion(homog_outer_prods, design_factors,
     M0, M1 = get_M0_and_M1_matrices(
         homog_outer_prods, design_prob_measure, noise_multiplier,
         regression_type)
-    print(M1, "#!@, M1", np.linalg.cond(M1))
     M1_inv = np.linalg.inv(M1)
     if noise_multiplier is not None:
         gamma = M0.dot(M1_inv)
diff --git a/pyapprox/expdesign/tests/test_linear_oed.py b/pyapprox/expdesign/tests/test_linear_oed.py
index 3791c2fd..36dcc9a8 100644
--- a/pyapprox/expdesign/tests/test_linear_oed.py
+++ b/pyapprox/expdesign/tests/test_linear_oed.py
@@ -1047,7 +1047,7 @@ def test_michaelis_menten_model_minimax_d_optimal_least_squares_design(
         opt_problem = NonLinearAlphabetOptimalDesign('D', local_design_factors)
         mu = opt_problem.solve_nonlinear_minimax(
             parameter_samples, design_samples[np.newaxis, :],
-            {'iprint': 1, 'ftol': 1e-6, 'disp': True})
+            {'iprint': 1, 'ftol': 1e-4, 'disp': True})
         II = np.where(mu > 1e-5)[0]
         # given largest theta_2=1 then optimal design will be at 1/3,1
         # with masses=0.5
diff --git a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
index 4c167a70..e36d13b3 100644
--- a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
+++ b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
@@ -496,7 +496,9 @@ def test_best_model_subset_estimator(self):
         est._save_candidate_estimators = True
         np.set_printoptions(linewidth=1000)
         est.allocate_samples(
-            target_cost, {"verbosity": 1, "nprocs": 1, "scaling": 1.})
+            target_cost, {"verbosity": 1, "nprocs": 1, "scaling": 1.,
+                          "init_guess": {"disp": True, "maxiter": 100,
+                                         "lower_bound": 1e-3}})
 
         criteria = np.array(
             [e[0]._optimized_criteria for e in est._candidate_estimators])
@@ -525,7 +527,9 @@ def test_best_model_subset_estimator(self):
         stat = multioutput_stats["mean_variance"](len(qoi_idx))
         stat.set_pilot_quantities(cov, W, B)
         est = get_estimator("gmf", stat, costs)
-        est.allocate_samples(target_cost)
+        est.allocate_samples(target_cost,
+                             {"init_guess": {"disp": True, "maxiter": 100,
+                                             "lower_bound": 1e-3}})
         hfcovar_mc, hfcovar, covar_mc, covar, est_vals, Q, delta = (
             numerically_compute_estimator_variance(
                 funs, model.variable, est, ntrials, max_eval_concurrency, True)
diff --git a/pyapprox/optimization/tests/test_minimize.py b/pyapprox/optimization/tests/test_minimize.py
index 47cfb966..fb8329d9 100644
--- a/pyapprox/optimization/tests/test_minimize.py
+++ b/pyapprox/optimization/tests/test_minimize.py
@@ -254,7 +254,7 @@ def _jacobian(self, x):
             np.full((ndesign_vars+nconstraints,), np.inf))
         optimizer = ScipyConstrainedOptimizer(
             objective, bounds=bounds, constraints=[constraint],
-            opts={"gtol": 1e-6, "verbose": 3, "maxiter": 500})
+            opts={"gtol": 3e-6, "verbose": 3, "maxiter": 500})
         result = optimizer.minimize(opt_x0)
 
         # errors in sample based estimate of CVaR will cause
@@ -263,7 +263,10 @@ def _jacobian(self, x):
             constraint(result.x[:, None]), [CVaR1, CVaR2], rtol=1e-2)
         # print(constraint(exact_opt_x), [CVaR1, CVaR2])
         # print(result.x-exact_opt_x[:, 0], exact_opt_x[:, 0])
-        assert np.allclose(result.x, exact_opt_x[:, 0], rtol=1e-3, atol=1e-6)
+
+        # TODO: on ubuntu reducing gtol causes minimize not to converge
+        # ideally find reason and dencrease rtol and atol below
+        assert np.allclose(result.x, exact_opt_x[:, 0], rtol=2e-3, atol=1e-5)
         assert np.allclose(-sigma1, result.fun, rtol=1e-4)
 
 
diff --git a/tutorials/multi_fidelity/plot_multioutput_acv.py b/tutorials/multi_fidelity/plot_multioutput_acv.py
index 91c934dd..0f999417 100644
--- a/tutorials/multi_fidelity/plot_multioutput_acv.py
+++ b/tutorials/multi_fidelity/plot_multioutput_acv.py
@@ -32,7 +32,10 @@
 stat = mf.multioutput_stats["mean"](benchmark.nqoi)
 stat.set_pilot_quantities(cov)
 est = mf.get_estimator("gmf", stat, costs)
-est.allocate_samples(target_cost, {"scaling": 1.})
+est.allocate_samples(
+    target_cost, {"scaling": 1.,
+                  "init_guess": {"disp": True, "maxiter": 100,
+                                 "lower_bound": 1e-3}})
 
 # get covariance of just first qoi
 qoi_idx = [0]

From fdfaf1237c4d76bb7a095503f266f471a283de29 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Fri, 24 May 2024 12:18:57 -0600
Subject: [PATCH 11/15] Fix tolerance to account for cross platform differences
 in multioutput acv test on ubunutu

---
 pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py | 2 +-
 tutorials/multi_fidelity/plot_multioutput_acv.py             | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
index e36d13b3..d8ee0780 100644
--- a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
+++ b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
@@ -496,7 +496,7 @@ def test_best_model_subset_estimator(self):
         est._save_candidate_estimators = True
         np.set_printoptions(linewidth=1000)
         est.allocate_samples(
-            target_cost, {"verbosity": 1, "nprocs": 1, "scaling": 1.,
+            target_cost, {"verbosity": 1, "nprocs": 1, "scaling": 5.,
                           "init_guess": {"disp": True, "maxiter": 100,
                                          "lower_bound": 1e-3}})
 
diff --git a/tutorials/multi_fidelity/plot_multioutput_acv.py b/tutorials/multi_fidelity/plot_multioutput_acv.py
index 0f999417..1d038bbc 100644
--- a/tutorials/multi_fidelity/plot_multioutput_acv.py
+++ b/tutorials/multi_fidelity/plot_multioutput_acv.py
@@ -28,12 +28,12 @@
     mf.get_correlation_from_covariance(cov), ax=ax, model_names=labels,
     label_fontsize=20)
 
-target_cost = 10
+target_cost = 30
 stat = mf.multioutput_stats["mean"](benchmark.nqoi)
 stat.set_pilot_quantities(cov)
 est = mf.get_estimator("gmf", stat, costs)
 est.allocate_samples(
-    target_cost, {"scaling": 1.,
+    target_cost, {"scaling": 5.,
                   "init_guess": {"disp": True, "maxiter": 100,
                                  "lower_bound": 1e-3}})
 

From 2a2e8d7049516ca52f8d16b428b57bd4493fc250 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Fri, 24 May 2024 16:55:57 -0600
Subject: [PATCH 12/15] Again trying to fix cross platform diffs

---
 pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py | 4 ++--
 tutorials/multi_fidelity/plot_multioutput_acv.py             | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
index d8ee0780..cf4fccbe 100644
--- a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
+++ b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
@@ -496,8 +496,8 @@ def test_best_model_subset_estimator(self):
         est._save_candidate_estimators = True
         np.set_printoptions(linewidth=1000)
         est.allocate_samples(
-            target_cost, {"verbosity": 1, "nprocs": 1, "scaling": 5.,
-                          "init_guess": {"disp": True, "maxiter": 100,
+            target_cost, {"verbosity": 1, "nprocs": 1, "scaling": 1,
+                          "init_guess": {"disp": True, "maxiter": 300,
                                          "lower_bound": 1e-3}})
 
         criteria = np.array(
diff --git a/tutorials/multi_fidelity/plot_multioutput_acv.py b/tutorials/multi_fidelity/plot_multioutput_acv.py
index 1d038bbc..d759dbe3 100644
--- a/tutorials/multi_fidelity/plot_multioutput_acv.py
+++ b/tutorials/multi_fidelity/plot_multioutput_acv.py
@@ -33,8 +33,8 @@
 stat.set_pilot_quantities(cov)
 est = mf.get_estimator("gmf", stat, costs)
 est.allocate_samples(
-    target_cost, {"scaling": 5.,
-                  "init_guess": {"disp": True, "maxiter": 100,
+    target_cost, {"scaling": 1.,
+                  "init_guess": {"disp": True, "maxiter": 300,
                                  "lower_bound": 1e-3}})
 
 # get covariance of just first qoi

From 2e04a9925ffe0273bb8c312e8ae431fa47e1d0cd Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Sun, 26 May 2024 16:39:38 -0600
Subject: [PATCH 13/15] Add continuous worfklow to build docs purely with pip

---
 ...ntinuous-integration-workflow-docs-pip.yml | 50 +++++++++++++++++++
 .../tests/test_multioutput_monte_carlo.py     |  2 +-
 .../multi_fidelity/plot_multioutput_acv.py    |  2 +-
 3 files changed, 52 insertions(+), 2 deletions(-)
 create mode 100644 .github/workflows/continuous-integration-workflow-docs-pip.yml

diff --git a/.github/workflows/continuous-integration-workflow-docs-pip.yml b/.github/workflows/continuous-integration-workflow-docs-pip.yml
new file mode 100644
index 00000000..2e4bd6b3
--- /dev/null
+++ b/.github/workflows/continuous-integration-workflow-docs-pip.yml
@@ -0,0 +1,50 @@
+name: Build Docs Using Pip
+
+on:
+  # push:
+  # branches: [master]
+  # branches: [master, devel]
+  pull_request:
+    branches: [devel]
+
+  workflow_dispatch:
+
+
+#   # schedule:
+#   #  # * is a special character in YAML so you have to quote this string
+#   #  - cron:  '*/0 * * * *' # run once a day
+
+
+jobs:
+  pyapprox_unit_tests:
+    name: Build docs with pip-build
+    runs-on: ${{ matrix.os }}
+    strategy:
+      fail-fast: false
+      matrix:
+        # os: [ubuntu-latest]
+        python-version: [3.8, 3.9, '3.10', '3.11']
+        os: [ubuntu-latest, macos-latest]
+        # python-version: [3.7, 3.8] #3.8 currently fails due to numpy error
+        # solely experienced when using github actions ValueError:
+        # numpy.ndarray size changed, may indicate binary incompatibility.
+        # Expected 96 from C header, got 88 from PyObject
+
+    steps:
+      - uses: actions/checkout@v4
+      - name: Setup Python ${{ matrix.python-version }} on ${{ matrix.os }}
+        uses: actions/setup-python@v2
+        with:
+          python-version: ${{ matrix.python-version }}
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+      - name: Setup PyApprox Documentation
+        shell: bash -l {0}
+        run: |
+          pip install -e .[docs]
+      - name: Create PyApprox Documentation
+        shell: bash -l {0}
+        run: |
+          cd docs
+          make html SPHINXOPTS=-vvv
diff --git a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
index cf4fccbe..2f33f00d 100644
--- a/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
+++ b/pyapprox/multifidelity/tests/test_multioutput_monte_carlo.py
@@ -498,7 +498,7 @@ def test_best_model_subset_estimator(self):
         est.allocate_samples(
             target_cost, {"verbosity": 1, "nprocs": 1, "scaling": 1,
                           "init_guess": {"disp": True, "maxiter": 300,
-                                         "lower_bound": 1e-3}})
+                                         "lower_bound": 1e-10}})
 
         criteria = np.array(
             [e[0]._optimized_criteria for e in est._candidate_estimators])
diff --git a/tutorials/multi_fidelity/plot_multioutput_acv.py b/tutorials/multi_fidelity/plot_multioutput_acv.py
index d759dbe3..06df9440 100644
--- a/tutorials/multi_fidelity/plot_multioutput_acv.py
+++ b/tutorials/multi_fidelity/plot_multioutput_acv.py
@@ -35,7 +35,7 @@
 est.allocate_samples(
     target_cost, {"scaling": 1.,
                   "init_guess": {"disp": True, "maxiter": 300,
-                                 "lower_bound": 1e-3}})
+                                 "lower_bound": 1e-10}})
 
 # get covariance of just first qoi
 qoi_idx = [0]

From a3e263e01ec69b991bbf718c371551de16e4ecc4 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Mon, 27 May 2024 17:04:05 -0600
Subject: [PATCH 14/15] python3.8 is near end of life so stop running CI using
 3.8.

---
 .../continuous-integration-workflow-conda.yml         | 11 +----------
 .../continuous-integration-workflow-docs-pip.yml      |  7 +------
 .../continuous-integration-workflow-docs.yml          | 10 +---------
 .../workflows/continuous-integration-workflow-pip.yml |  2 +-
 setup.py                                              |  1 +
 5 files changed, 5 insertions(+), 26 deletions(-)

diff --git a/.github/workflows/continuous-integration-workflow-conda.yml b/.github/workflows/continuous-integration-workflow-conda.yml
index ce0098d2..7d8556a2 100644
--- a/.github/workflows/continuous-integration-workflow-conda.yml
+++ b/.github/workflows/continuous-integration-workflow-conda.yml
@@ -22,16 +22,9 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        # os: [ubuntu-latest]
-        # pin to python-3.7.16 because github actions has a bug with _bz2 on
-        # ubunutu for 3.7.17
         # quotes needed around two-digit versions
-        python-version: [3.8, 3.9, '3.10', '3.11']
+        python-version: [3.9, '3.10', '3.11']
         os: [ubuntu-latest, macos-latest]
-        # python-version: [3.7, 3.8] #3.8 currently fails due to numpy error
-        # solely experienced when using github actions ValueError:
-        # numpy.ndarray size changed, may indicate binary incompatibility.
-        # Expected 96 from C header, got 88 from PyObject
 
     steps:
       - uses: actions/checkout@v4
@@ -40,11 +33,9 @@ jobs:
         with:
           activate-environment: pyapprox-base
           python-version: ${{ matrix.python-version }}
-          # channels: defaults,conda-forge
           channels: defaults
           environment-file: environment.yml
           auto-update-conda: true
-          # use-only-tar-bz2: true
           auto-activate-base: false
       - name: Conda list
         shell: bash -l {0}  # - l {0} is needed to activate created env
diff --git a/.github/workflows/continuous-integration-workflow-docs-pip.yml b/.github/workflows/continuous-integration-workflow-docs-pip.yml
index 2e4bd6b3..290e5cba 100644
--- a/.github/workflows/continuous-integration-workflow-docs-pip.yml
+++ b/.github/workflows/continuous-integration-workflow-docs-pip.yml
@@ -23,13 +23,8 @@ jobs:
       fail-fast: false
       matrix:
         # os: [ubuntu-latest]
-        python-version: [3.8, 3.9, '3.10', '3.11']
+        python-version: [3.9, '3.10', '3.11']
         os: [ubuntu-latest, macos-latest]
-        # python-version: [3.7, 3.8] #3.8 currently fails due to numpy error
-        # solely experienced when using github actions ValueError:
-        # numpy.ndarray size changed, may indicate binary incompatibility.
-        # Expected 96 from C header, got 88 from PyObject
-
     steps:
       - uses: actions/checkout@v4
       - name: Setup Python ${{ matrix.python-version }} on ${{ matrix.os }}
diff --git a/.github/workflows/continuous-integration-workflow-docs.yml b/.github/workflows/continuous-integration-workflow-docs.yml
index bf3e8082..bbdf0ede 100644
--- a/.github/workflows/continuous-integration-workflow-docs.yml
+++ b/.github/workflows/continuous-integration-workflow-docs.yml
@@ -22,14 +22,8 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        # os: [ubuntu-latest]
-        python-version: [3.8, 3.9, '3.10', '3.11']
+        python-version: [3.9, '3.10', '3.11']
         os: [ubuntu-latest, macos-latest]
-        # python-version: [3.7, 3.8] #3.8 currently fails due to numpy error
-        # solely experienced when using github actions ValueError:
-        # numpy.ndarray size changed, may indicate binary incompatibility.
-        # Expected 96 from C header, got 88 from PyObject
-
     steps:
       - uses: actions/checkout@v4
       - name: Setup Miniconda with Python ${{ matrix.python-version }} on ${{ matrix.os }}
@@ -37,10 +31,8 @@ jobs:
         with:
           activate-environment: pyapprox-base
           python-version: ${{ matrix.python-version }}
-          # channels: defaults,conda-forge
           channels: defaults
           environment-file: environment.yml
-          # use-only-tar-bz2: true
           auto-update-conda: true
           auto-activate-base: false
       - name: Conda list
diff --git a/.github/workflows/continuous-integration-workflow-pip.yml b/.github/workflows/continuous-integration-workflow-pip.yml
index 813f9012..4b4ee544 100644
--- a/.github/workflows/continuous-integration-workflow-pip.yml
+++ b/.github/workflows/continuous-integration-workflow-pip.yml
@@ -23,7 +23,7 @@ jobs:
       fail-fast: false
       matrix:
         os: [macos-latest, ubuntu-latest]
-        python-version: [3.8, 3.9, '3.10', '3.11']
+        python-version: [3.9, '3.10', '3.11']
         # exclude:
         #  # stalls on github actions
         #  - os: ubuntu-latest
diff --git a/setup.py b/setup.py
index 6055cf70..7a0e09f8 100644
--- a/setup.py
+++ b/setup.py
@@ -50,6 +50,7 @@ def no_cythonize(extensions, **_ignore):
     include_dirs=[np.get_include()],
     setup_requires=['numpy >= 1.16.4', 'Cython', 'scipy >= 1.0.0'],
     install_requires=[
+        'setuptools',
         'numpy >= 1.16.4',
         'matplotlib',
         'scipy >= 1.0.0',

From 3516b120046d5e1d09f465209f04cd861b76d5a0 Mon Sep 17 00:00:00 2001
From: John Jakeman <jdjakem@users.noreply.github.com>
Date: Tue, 28 May 2024 11:06:42 -0600
Subject: [PATCH 15/15] Avoid broken setuptools for somer versions of python
 when building docs with pip

---
 .github/workflows/continuous-integration-workflow-docs-pip.yml | 2 +-
 pyproject.toml                                                 | 1 +
 setup.py                                                       | 3 ++-
 3 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/continuous-integration-workflow-docs-pip.yml b/.github/workflows/continuous-integration-workflow-docs-pip.yml
index 290e5cba..52cbc07c 100644
--- a/.github/workflows/continuous-integration-workflow-docs-pip.yml
+++ b/.github/workflows/continuous-integration-workflow-docs-pip.yml
@@ -26,7 +26,7 @@ jobs:
         python-version: [3.9, '3.10', '3.11']
         os: [ubuntu-latest, macos-latest]
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v2
       - name: Setup Python ${{ matrix.python-version }} on ${{ matrix.os }}
         uses: actions/setup-python@v2
         with:
diff --git a/pyproject.toml b/pyproject.toml
index 9d47cf48..96df3529 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -27,6 +27,7 @@ classifiers=[
     "Operating System :: OS Independent",
 ]    
 dependencies = [
+    'setuptools',
     'numpy >= 1.16.4',
     'matplotlib',
     'scipy >= 1.0.0',
diff --git a/setup.py b/setup.py
index 7a0e09f8..8838f837 100644
--- a/setup.py
+++ b/setup.py
@@ -48,7 +48,8 @@ def no_cythonize(extensions, **_ignore):
         "Operating System :: OS Independent",
     ],
     include_dirs=[np.get_include()],
-    setup_requires=['numpy >= 1.16.4', 'Cython', 'scipy >= 1.0.0'],
+    setup_requires=['numpy >= 1.16.4', 'Cython', 'scipy >= 1.0.0',
+                    'setuptools'],
     install_requires=[
         'setuptools',
         'numpy >= 1.16.4',