diff --git a/.gitignore b/.gitignore
index 09768c5..296f9af 100644
--- a/.gitignore
+++ b/.gitignore
@@ -212,5 +212,6 @@ pyrightconfig.json
 # End of https://www.toptal.com/developers/gitignore/api/python,visualstudiocode
 
 .venv*
-
 Taskfile.yml
+.DS_Store
+*~
diff --git a/pyproject.toml b/pyproject.toml
index c74e6db..b36ae29 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -18,7 +18,7 @@ license = { text = "BSD-3-Clause" }
 classifiers = ["Programming Language :: Python :: 3"]
 # TODO move some dependencies into optional dependencies
 dependencies = [
-  "intersect_sdk>=0.9.0,<0.10.0",
+  "intersect_sdk>=0.9.3,<0.10.0",
   "numpy",
   "scikit-learn>=1.4.0,<2.0.0",                        # TODO consider making an optional dependency group
   "scipy>=1.12.0,<2.0.0",
diff --git a/scripts/1d_sable_client.py b/scripts/1d_sable_client.py
index 380d66c..727365b 100644
--- a/scripts/1d_sable_client.py
+++ b/scripts/1d_sable_client.py
@@ -23,6 +23,7 @@
     DialInputSingleOtherStrategy,
     DialWorkflowCreationParamsClient,
     DialWorkflowDatasetUpdate,
+    Normal,
 )
 
 mpl.use('agg')
@@ -94,6 +95,8 @@ def __init__(self, service_destination: str):
 
         self.dataset_x = self.x_raw.reshape(-1, 1).tolist()
         self.dataset_y = self.y_raw.reshape(-1).tolist()
+        self.labels_y = ['y']
+        self.statistics_y = Normal(loc='y', scale=self.noise_level)
         self.test_points = self.x_test.reshape(-1, 1).tolist()
 
         self.kernel = 'rbf'
@@ -104,7 +107,6 @@ def __init__(self, service_destination: str):
             'alpha': 0.05,
             'p': 1.25,
             'n_iter_irls': 100,
-            'noise_level': self.noise_level,
         }
         self.strategy = 'upper_confidence_bound'
         self.strategy_args = {'exploit': 0.0, 'explore': 1.0}
@@ -160,6 +162,8 @@ def callback_message(self, operation: str, **kwargs) -> IntersectClientCallback:
             next_payload = DialWorkflowCreationParamsClient(
                 dataset_x=self.dataset_x,
                 dataset_y=self.dataset_y,
+                labels_y=self.labels_y,
+                statistics_y=self.statistics_y,
                 bounds=self.bounds.tolist(),
                 kernel=self.kernel,
                 kernel_args=self.kernel_args,
@@ -216,14 +220,12 @@ def callback_message(self, operation: str, **kwargs) -> IntersectClientCallback:
 
     def handle_surrogate_values(self, payload):
         means = payload['values']
-        transformed_stddevs = payload['transformed_stddevs']
+        stddevs = payload['stddevs']
         if self.at_grids:
-            self.stddev_grid = np.array(transformed_stddevs).reshape(
-                (self.meshgrid_size,) * self.num_dims
-            )
+            self.stddev_grid = np.array(stddevs).reshape((self.meshgrid_size,) * self.num_dims)
             self.mean_grid = np.array(means).reshape((self.meshgrid_size,) * self.num_dims)
         else:
-            self.stddev_test = np.array(transformed_stddevs)
+            self.stddev_test = np.array(stddevs)
             self.mean_test = np.array(means)
             print(
                 f'Values at testing points {self.x_test.reshape(-1)}: Mean: {self.mean_test}, Stddev: {self.stddev_test}'
diff --git a/scripts/1d_sinusoidal_growth_client.py b/scripts/1d_sinusoidal_growth_client.py
index a321e46..756f4e8 100644
--- a/scripts/1d_sinusoidal_growth_client.py
+++ b/scripts/1d_sinusoidal_growth_client.py
@@ -23,6 +23,7 @@
     DialInputSingleOtherStrategy,
     DialWorkflowCreationParamsClient,
     DialWorkflowDatasetUpdate,
+    Normal,
 )
 
 mpl.use('agg')
@@ -52,14 +53,14 @@ def __init__(self):
 
 class ActiveLearningOrchestrator:
     def __init__(self, service_destination: str):
-        self.bounds = np.array([[-2, 2]])
+        self.bounds = [[-2.0, 2.0]]
         self.num_dims = len(self.bounds)
 
-        self.x_raw = np.array([[1], [2.0]])
-        self.x_test = np.array([[-1], [0.5]])
+        self.x_raw = np.array([[1.0], [2.0]])
+        self.x_test = np.array([[-1.0], [0.5]])
         self.y_raw = sinusoidal_growth(self.x_raw)
 
-        self.meshgrid_size = 100
+        self.meshgrid_size = 200
         self.grid_points = [
             np.linspace(dim_bounds[0], dim_bounds[1], self.meshgrid_size)
             for dim_bounds in self.bounds
@@ -72,18 +73,47 @@ def __init__(self, service_destination: str):
         self.dataset_y = self.y_raw.reshape(-1).tolist()
         self.test_points = self.x_test.reshape(-1, 1).tolist()
 
-        self.kernel = 'rbf'
-        self.kernel_args = {'length_scale': 0.12, 'length_scale_bounds': (0.1, 1.0)}
+        # Assume that there is some small noise in the measurements to stabilize the fit
+        self.statistics_y = Normal(loc='y', scale=1e-6)
+
         self.backend = 'sklearn'
-        self.backend_args = None
+        if self.backend == 'sklearn':
+            # configure kernel_hyperparameters
+            self.kernel = 'matern'  # 'rbf' or 'matern'
+            self.kernel_args = {
+                'length_scale': 0.1,
+                'constant_value': 1.0,
+            }
+            self.optimize_lengthscale = False
+            if self.optimize_lengthscale:
+                self.kernel_args.update(
+                    {
+                        'length_scale_bounds': (0.02, 0.2),
+                    }
+                )
+            self.backend_args = {}
+        elif self.backend == 'sable':
+            self.kernel = 'rbf'
+            self.kernel_args = {
+                'x_range': [-2.0, 2.0],
+                'sigma_range': [1.0e-3, 1.0],
+                'gamma': 0.1,
+            }
+            self.backend_args = {
+                'n_features': 10000,
+                'alpha': 0.0005,
+                'p': 1.25,
+                'n_iter_irls': 20,
+            }
+
         self.strategy = 'upper_confidence_bound'
         self.strategy_args = {'exploit': 0.4, 'explore': 1}
         self.niter = 0
         self.max_iter = 20
         self.at_grids = True
-        self.variance_grid = None
+        self.stddev_grid = None
         self.mean_grid = None
-        self.variance_test = None
+        self.stddev_test = None
         self.mean_test = None
         self.x_next = None
 
@@ -92,18 +122,23 @@ def __init__(self, service_destination: str):
         self.service_destination = service_destination
 
     def __call__(
-        self, _source: str, operation: str, _has_error: bool, payload: INTERSECT_RESPONSE_VALUE
+        self,
+        _source: str,
+        operation: str,
+        _has_error: bool,
+        payload: INTERSECT_RESPONSE_VALUE,
     ) -> IntersectClientCallback:
-        print(
-            f'Received message from {_source} with operation {operation} and payload {payload}',
-            file=sys.stderr,
-        )
         if _has_error:
             print('============ERROR==============', file=sys.stderr)
             print(operation, file=sys.stderr)
             print(payload, file=sys.stderr)
             raise IntersectCallbackError(operation, payload)
 
+        # print(
+        #     f'Received message from {_source} with operation {operation} and payload {payload}',
+        #     file=sys.stderr,
+        # )
+
         if operation == 'dial.initialize_workflow':
             self.workflow_id = payload
             return self.callback_message('dial.get_surrogate_values')
@@ -142,10 +177,8 @@ def callback_message(self, operation: str, **kwargs) -> IntersectClientCallback:
                 kernel_args=self.kernel_args,
                 backend=self.backend,
                 backend_args=self.backend_args,
-                extra_args={'length_per_dimension': True},
                 preprocess_standardize=True,
                 y_is_good=True,
-                seed=20,
             )
 
         elif operation == 'dial.get_surrogate_values':
@@ -164,7 +197,8 @@ def callback_message(self, operation: str, **kwargs) -> IntersectClientCallback:
                 workflow_id=self.workflow_id,
                 strategy=self.strategy,
                 strategy_args=self.strategy_args,
-                bounds=self.bounds.tolist(),
+                bounds=self.bounds,
+                y_is_good=True,
             )
 
         elif operation == 'dial.update_workflow_with_data':
@@ -181,23 +215,23 @@ def callback_message(self, operation: str, **kwargs) -> IntersectClientCallback:
         return IntersectClientCallback(
             messages_to_send=[
                 IntersectDirectMessageParams(
-                    destination=self.service_destination, operation=operation, payload=next_payload
+                    destination=self.service_destination,
+                    operation=operation,
+                    payload=next_payload,
                 )
             ]
         )
 
     def handle_surrogate_values(self, payload):
         means = payload['values']
-        transformed_stddevs = payload['transformed_stddevs']
+        stddevs = payload['stddevs']
         if self.at_grids:
-            self.variance_grid = np.array(transformed_stddevs).reshape(
-                (self.meshgrid_size,) * self.num_dims
-            )
+            self.stddev_grid = np.array(stddevs).reshape((self.meshgrid_size,) * self.num_dims)
             self.mean_grid = np.array(means).reshape((self.meshgrid_size,) * self.num_dims)
         else:
-            self.variance_test = np.array(transformed_stddevs)
+            self.stddev_test = np.array(stddevs)
             self.mean_test = np.array(means)
-            print(f'Test Mean: {self.mean_test}, Variance: {self.variance_test}')
+            print(f'Test Mean: {self.mean_test}, Std.Dev.: {self.stddev_test}')
 
         # end of active learning loop after max_iter
         if self.niter > self.max_iter:
@@ -224,12 +258,12 @@ def graph(self):
 
         fig, axs = plt.subplots(2, 1, figsize=(10, 8), sharex=True)
 
-        # First subplot: Mean and variance with training data
+        # First subplot: Mean and standard deviation with training data
         axs[0].plot(self.x_grid, self.mean_grid, label='Mean Prediction')
         axs[0].fill_between(
             self.x_grid[:, 0],
-            self.mean_grid + 2 * self.variance_grid,
-            self.mean_grid - 2 * self.variance_grid,
+            self.mean_grid + 2 * self.stddev_grid,
+            self.mean_grid - 2 * self.stddev_grid,
             alpha=0.5,
             label='Confidence Interval',
         )
@@ -248,19 +282,20 @@ def graph(self):
 
         # Second subplot: Acquisition function
         if self.strategy_args is not None:
-            if self.mean_grid is not None and self.variance_grid is not None:
+            if self.mean_grid is not None and self.stddev_grid is not None:
                 exploit = self.strategy_args.get('exploit', 0.0)
                 explore = self.strategy_args.get('explore', 1.0)
-                acquisition_values = exploit * self.mean_grid + explore * np.sqrt(
-                    self.variance_grid
-                )
+                acquisition_values = exploit * self.mean_grid + explore * self.stddev_grid
             else:
                 acquisition_values = np.zeros_like(self.x_grid)
 
             axs[1].plot(self.x_grid, acquisition_values)
             if self.x_next is not None:
                 axs[1].axvline(
-                    x=self.x_next[0], color='red', linestyle='--', label='Next Point (x_next)'
+                    x=self.x_next[0],
+                    color='red',
+                    linestyle='--',
+                    label='Next Point (x_next)',
                 )
             axs[1].set_xlabel('Features, x')
             axs[1].set_ylabel('Acquisition Value')
@@ -268,7 +303,7 @@ def graph(self):
             axs[1].grid(True)
 
         plt.tight_layout()
-        plt.savefig('graph.png')
+        plt.savefig('graph_sinusoidal.png')
         plt.close(fig)
 
 
diff --git a/scripts/2d_rosenbrock_client.py b/scripts/2d_rosenbrock_client.py
index af14344..9be7e92 100644
--- a/scripts/2d_rosenbrock_client.py
+++ b/scripts/2d_rosenbrock_client.py
@@ -3,6 +3,7 @@
 import logging
 import os
 import sys
+from collections import deque
 from pathlib import Path
 from typing import Any
 
@@ -22,6 +23,7 @@
 # from scipy.stats import qmc
 from dial_dataclass import (
     DialInputPredictions,
+    DialInputSingleConfidenceBound,
     DialInputSingleOtherStrategy,
     DialWorkflowCreationParamsClient,
     DialWorkflowDatasetUpdate,
@@ -65,11 +67,11 @@ def generate_dataset_x(num_dims):
 )
 INITIAL_POINTS_TO_PREDICT = np.hstack([mg.reshape(-1, 1) for mg in INITIAL_MESHGRIDS]).tolist()
 
-NUM_ITERATIONS = 35
+NUM_ITERATIONS = 200
 
 # HYPERPARAMETERS
-LENGTH_SCALE = 0.2
-NOISE_LEVEL = 10e-6
+LENGTH_SCALE = 0.1
+NOISE_LEVEL = 10e-8
 CONSTANT_VALUE = 1.0
 
 
@@ -86,6 +88,23 @@ def __init__(self, service_destination: str, rosenbrock_destination: str):
         self.dataset_x = INITIAL_DATASET_X
         self.dataset_y: list[float] = []
 
+        # we want to minimize
+        self.y_is_good = False
+
+        # Initialize a deque of strategies with desired number of iterations
+        self.strategies = deque(
+            [
+                (20, 'uncertainty', {}),
+                (40, 'upper_confidence_bound', {'exploit': 1.0, 'explore': 0.5}),
+                (40, 'confidence_bound', {'confidence_bound': 0.9}),
+                (200, 'expected_improvement', {}),
+            ]
+        )
+
+        # if we want to test discrete measurements
+        self.discrete_measurements = False
+        self.discrete_measurement_grid_size = [200, 200]
+
     # create a message to send to the server
     def assemble_message(self, operation: str, **kwargs: Any) -> IntersectClientCallback:
         if operation == 'initialize_workflow':
@@ -103,9 +122,9 @@ def assemble_message(self, operation: str, **kwargs: Any) -> IntersectClientCall
                     'constant_value': CONSTANT_VALUE,
                     'constant_value_bounds': 'fixed',
                 },
-                length_per_dimension=False,  # allow the matern to use separate length scales for the two parameters
-                y_is_good=False,  # we wish to minimize y (the error)
-                backend='sklearn',  # "sklearn" or "gpax"
+                preprocess_standardize=True,
+                y_is_good=self.y_is_good,  # we wish to minimize y (the error)
+                backend='sklearn',
                 seed=-1,  # Use seed = -1 for random results
             )
         elif operation == 'update_workflow_with_data':
@@ -114,11 +133,31 @@ def assemble_message(self, operation: str, **kwargs: Any) -> IntersectClientCall
                 **kwargs,
             )
         elif operation == 'get_next_point':
-            payload = DialInputSingleOtherStrategy(
-                workflow_id=self.workflow_id,
-                strategy='expected_improvement',
-                bounds=INITIAL_BOUNDS,
-            )
+            # select strategy
+            Niter, strategy, strategy_args = self.strategies.popleft()
+            Niter -= 1
+            if Niter > 0:
+                self.strategies.appendleft((Niter, strategy, strategy_args))
+            if strategy == 'confidence_bound':
+                payload = DialInputSingleConfidenceBound(
+                    workflow_id=self.workflow_id,
+                    bounds=INITIAL_BOUNDS,
+                    y_is_good=self.y_is_good,  # we wish to minimize y (the error)
+                    strategy='confidence_bound',
+                    confidence_bound=strategy_args['confidence_bound'],
+                    discrete_measurements=self.discrete_measurements,
+                    discrete_measurement_grid_size=self.discrete_measurement_grid_size,
+                )
+            else:
+                payload = DialInputSingleOtherStrategy(
+                    workflow_id=self.workflow_id,
+                    bounds=INITIAL_BOUNDS,
+                    y_is_good=self.y_is_good,  # we wish to minimize y (the error)
+                    strategy=strategy,
+                    strategy_args=strategy_args,
+                    discrete_measurements=self.discrete_measurements,
+                    discrete_measurement_grid_size=self.discrete_measurement_grid_size,
+                )
         elif operation == 'get_surrogate_values':
             payload = DialInputPredictions(
                 workflow_id=self.workflow_id,
@@ -179,7 +218,9 @@ def __call__(
         if operation == 'Rosenbrock.rosenbrock':
             # this operation gets called periodically
             self.dataset_y.append(payload)
-            print(f'{payload:.3f}')
+            coord_str = ', '.join([f'{x:.2f}' for x in self.dataset_x[-1]])
+            strategy = self.strategies[0][1]
+            print(f'got value {payload:.5f} at [{coord_str}] with strategy {strategy}')
             if len(self.dataset_x) == NUM_ITERATIONS:
                 minpos = np.argmin(self.dataset_y)
                 y_opt = self.dataset_y[minpos]
@@ -187,7 +228,7 @@ def __call__(
                 self.graph(optimal_coords, True)
                 coord_str = ', '.join([f'{coord:.2f}' for coord in optimal_coords])
                 print(
-                    f'Optimal simulated datapoint at ({coord_str}), y={y_opt:.3f}',
+                    f'Optimal simulated datapoint at ({coord_str}), y={y_opt:.5f}',
                     end='\n',
                     flush=True,
                 )
@@ -245,8 +286,8 @@ def graph(self, x_EI: list[float], final: bool = False):
             plt.ylabel('Simulation Parameter #2')
             # add black dots for data points and a red marker for the recommendation:
             X_train = np.array(self.dataset_x)
-            plt.scatter(X_train[:, 0], X_train[:, 1], color='black', marker='o')
-            plt.scatter(1.0, 1.0, s=300, color='None', edgecolors='black', marker='o')
+            plt.scatter(X_train[:, 0], X_train[:, 1], color='black', marker='.')
+            plt.scatter(1.0, 1.0, s=300, color='None', edgecolors='tab:orange', marker='o')
 
             minpos = np.argmin(self.dataset_y)
             optimal_coords = self.dataset_x[minpos]
@@ -258,7 +299,7 @@ def graph(self, x_EI: list[float], final: bool = False):
                     f'Best point estimate so far is x=({final_x}), y={self.dataset_y[minpos]:.3f}'
                 )
             else:
-                plt.scatter([x_EI[0]], [x_EI[1]], color='red', marker='o')
+                plt.scatter([x_EI[0]], [x_EI[1]], color='tab:red', marker='o')
                 plt.scatter(
                     [x_EI[0]],
                     [x_EI[1]],
@@ -267,7 +308,7 @@ def graph(self, x_EI: list[float], final: bool = False):
                     marker='o',
                     s=300,
                 )
-            plt.savefig('graph.png')
+            plt.savefig('graph_rosenbrock.png', dpi=200)
         else:
             fig, ax = plt.subplots(figsize=(8, 6))
             message = (
diff --git a/scripts/manual_client.py b/scripts/manual_client.py
index b3e5a03..47241db 100644
--- a/scripts/manual_client.py
+++ b/scripts/manual_client.py
@@ -135,7 +135,9 @@ def assemble_message(self, operation: str, **kwargs: Any) -> IntersectClientCall
                 dataset_y=INITIAL_DATASET_Y,
                 bounds=BOUNDS,
                 kernel='matern',
-                length_per_dimension=True,  # allow the matern to use separate length scales for the two parameters
+                extra_args={
+                    'length_per_dimension': True
+                },  # allow the matern to use separate length scales for the two parameters
                 y_is_good=False,  # we wish to minimize y (the error)
                 backend='sklearn',  # "sklearn" or "gpax"
                 seed=-1,  # Use seed = -1 for random results
@@ -149,6 +151,7 @@ def assemble_message(self, operation: str, **kwargs: Any) -> IntersectClientCall
             payload = DialInputSingleOtherStrategy(
                 workflow_id=self.workflow_id,
                 strategy='expected_improvement',
+                bounds=BOUNDS,
             )
         elif operation == 'get_surrogate_values':
             payload = DialInputPredictions(
@@ -171,7 +174,11 @@ def assemble_message(self, operation: str, **kwargs: Any) -> IntersectClientCall
     # The callback function.  This is called whenever the server responds to our message.
     # This could instead be implemented by defining a callback method (and passing it later), but here we chose to directly make the object callable.
     def __call__(
-        self, _source: str, operation: str, _has_error: bool, payload: INTERSECT_RESPONSE_VALUE
+        self,
+        _source: str,
+        operation: str,
+        _has_error: bool,
+        payload: INTERSECT_RESPONSE_VALUE,
     ) -> IntersectClientCallback:
         if _has_error:
             print('============ERROR==============', file=sys.stderr)
@@ -179,20 +186,27 @@ def __call__(
             print(payload, file=sys.stderr)
             print(file=sys.stderr)
             raise Exception  # noqa: TRY002 (break INTERSECT loop)
+
         if operation == 'dial.initialize_workflow':
             self.workflow_id: str = payload
             return self.assemble_message('get_surrogate_values')
+
         if operation == 'dial.update_workflow_with_data':
             return self.assemble_message('get_surrogate_values')
-        if (
-            operation == 'dial.get_surrogate_values'
-        ):  # if we receive a grid of surrogate values, record it for graphing, then ask for the next recommended point
-            self.mean_grid = np.array(payload['values']).reshape(XX.shape)
+
+        if operation == 'dial.get_surrogate_values':
+            # if we receive a grid of surrogate values, record it for graphing, then ask for the next recommended point
+            means = payload['values']
+            self.mean_grid = np.array(means).reshape(XX.shape)
             return self.assemble_message('get_next_point')
+
         if operation == 'dial.get_next_point':
-            # if we receive an EI recommendation, record it, show the user the current graph, and ask the user for the results of their experiment:
-            self.graph(payload)
-            return self.add_data(payload)
+            # if we receive an EI recommendation, record it, show the user the current graph,
+            # and ask the user for the results of their experiment:
+            data = payload['data']
+            self.graph(data)
+            update_message = self.add_data(data)
+            return update_message
 
         err_msg = f'Unknown operation received: {operation}'
         raise Exception(err_msg)  # noqa: TRY002 (INTERSECT interaction mechanism)
@@ -200,7 +214,13 @@ def __call__(
     # makes a color graph of the predicted yields, with markers for the training data and EI-recommended point:
     def graph(self, x_EI: list[float]):
         plt.clf()
-        plt.contourf(XX, YY, self.mean_grid, levels=np.linspace(0, 12, 101), extend='both')
+        plt.contourf(
+            XX,
+            YY,
+            self.mean_grid,
+            levels=np.linspace(0, 12, 101),
+            extend='both',
+        )
         cbar = plt.colorbar()
         cbar.set_ticks(np.linspace(0, 12, 7))
         cbar.set_label('C2H4 Yield (%)')
@@ -210,12 +230,22 @@ def graph(self, x_EI: list[float]):
         X_train = np.array(self.dataset_x)
         plt.scatter(X_train[:, 0], X_train[:, 1], color='black', marker='o')
         plt.scatter([x_EI[0]], [x_EI[1]], color='red', marker='o')
-        plt.scatter([x_EI[0]], [x_EI[1]], color='none', edgecolors='red', marker='o', s=300)
+        plt.scatter(
+            [x_EI[0]],
+            [x_EI[1]],
+            color='none',
+            edgecolors='red',
+            marker='o',
+            s=300,
+        )
         plt.savefig('graph.png')
 
     # asks the user for a data point (an experimental result) and adds it to our dataset
     def add_data(self, x_EI: list[float]):
-        print(f'\nEI recommends running at: {x_EI[0]:.1f} ms, {x_EI[1]:.1f} K', flush=True)
+        print(
+            f'\nEI recommends running at: {x_EI[0]:.1f} ms, {x_EI[1]:.1f} K',
+            flush=True,
+        )
         print('\nEnter Experimental Data:', file=sys.stderr)
         x0 = read_float('Duration (ms):')
         x1 = read_float('Temperature (K):')
diff --git a/src/dial_dataclass/__init__.py b/src/dial_dataclass/__init__.py
index 35377f2..5bc49f4 100644
--- a/src/dial_dataclass/__init__.py
+++ b/src/dial_dataclass/__init__.py
@@ -1,4 +1,5 @@
 from .dial_dataclass import (
+    Delta,
     DialInputMultiple,
     DialInputMultipleOtherStrategy,
     DialInputPredictions,
@@ -8,6 +9,7 @@
     DialWorkflowCreationParamsClient,
     DialWorkflowDatasetUpdate,
     DialWorkflowDatasetUpdates,
+    Normal,
 )
 from .dial_dataclass_responses import (
     DialDataResponse1D,
diff --git a/src/dial_dataclass/dial_dataclass.py b/src/dial_dataclass/dial_dataclass.py
index 689abbd..8f45ebc 100644
--- a/src/dial_dataclass/dial_dataclass.py
+++ b/src/dial_dataclass/dial_dataclass.py
@@ -1,20 +1,158 @@
-from typing import Annotated, Literal
+from abc import ABC
+from typing import Annotated, Any, Literal
 
-from pydantic import BaseModel, Field, field_validator
+from pydantic import (
+    BaseModel,
+    Field,
+    ValidationInfo,
+    field_validator,
+    model_validator,
+)
 
 from .pydantic_helpers import ValidatedObjectId
 
-PositiveIntType = Annotated[int, Field(ge=0)]
-
 _POSSIBLE_BACKENDS = ('sklearn', 'gpax', 'sable')
 
 BackendType = Literal[_POSSIBLE_BACKENDS]
 
+PositiveIntType = Annotated[int, Field(ge=0)]  # NOTE: ge=0 also admits zero, despite the name
+
+Label = Annotated[str, Field(max_length=50, description='Label for a dataset entry.')]
+FloatOrLabel = Annotated[
+    float | Label,  # a plain number, or a length-limited label string
+    Field(
+        description='A constant float, or the label of a dataset entry.',
+    ),
+]
+
+
+class BaseDistribution(BaseModel, ABC):
+    """Shared fields of a statistical distribution: a name tag, a location and a scale."""
+
+    name: str  # narrowed to a Literal tag by Delta and Normal
+    loc: Annotated[
+        Label,  # always a label string, never a numeric constant
+        Field(
+            description='The location (mean, or center) of the distribution',
+        ),
+    ]
+    scale: Annotated[
+        FloatOrLabel,  # either a numeric constant or a label string
+        Field(
+            description='The scale or standard deviation of the distribution',
+        ),
+    ]
+
+
+class Delta(BaseDistribution):
+    """Deterministic distribution equal to its mean/loc; its scale is fixed at zero."""
+
+    name: Literal['Delta'] = Field(default='Delta', frozen=True)
+    scale: float = Field(ge=0.0, le=0.0, default=0.0, frozen=True)  # ge/le admit only zero
+
+
+class Normal(BaseDistribution):
+    """Normal distribution given by loc (mean) and scale (standard deviation)."""
+
+    name: Literal['Normal'] = Field(default='Normal', frozen=True)  # fixed tag for this model
+
+
+Distribution = Annotated[
+    Delta | Normal,
+    Field(
+        description='Union of all supported Distributions.',
+        discriminator='name',  # the Literal `name` tag selects which member model is used
+    ),
+]
+
+
+def _validate_dataset_lengths(dataset: list[Any]) -> bool:
+    """Return True if all entries are scalars, or all are lists of one common length."""
+    # Mixed scalar/list rows are reported as invalid (False) instead of crashing:
+    # calling len() on a float row would raise TypeError rather than a clean ValueError.
+    if not dataset:
+        return True
+    if not isinstance(dataset[0], list):
+        return not any(isinstance(row, list) for row in dataset[1:])
+    target_length = len(dataset[0])
+    return all(isinstance(row, list) and len(row) == target_length for row in dataset[1:])
+
+
+def _validate_dims_and_length(data: dict, x_name: str, y_name: str) -> tuple[int, int]:
+    """Check that both datasets have equal length and return the resolved (dim_x, dim_y).
+
+    ``data`` maps field names to values; explicit ``dim_x``/``dim_y`` entries, if not None,
+    must match the entry size inferred from the first row of the corresponding dataset.
+    If ``bounds`` is present, it must hold one row per x dimension.
+    Raises ValueError on any inconsistency or when a dimension cannot be inferred.
+    """
+    dataset_x, dataset_y = data[x_name], data[y_name]
+    len_x, len_y = len(dataset_x), len(dataset_y)
+    if len_y != len_x:
+        msg = f'Unequal number of points in {x_name} {len_x=} and {y_name} {len_y=}.'
+        raise ValueError(msg)
+
+    def compute_dim(dim, dataset, name):
+        if not dataset:
+            # nothing to infer from: an explicit dimension is required
+            if dim is None:
+                msg = (
+                    f'Can not infer dim from empty dataset {name}.'
+                    ' Set dim to the correct dimension.'
+                )
+                raise ValueError(msg)
+            return dim
+
+        # scalar entries count as one-dimensional
+        inferred_dim = len(dataset[0]) if isinstance(dataset[0], list) else 1
+        if dim is not None and inferred_dim != dim:
+            msg = (
+                f'Vectors in {name} must be of length {dim=}.'
+                ' Set dim to the correct dimension.'
+            )
+            raise ValueError(msg)
+        return inferred_dim
+
+    dim_x = compute_dim(data.get('dim_x'), dataset_x, x_name)
+    dim_y = compute_dim(data.get('dim_y'), dataset_y, y_name)
+
+    bounds = data.get('bounds')
+    if bounds is not None and len(bounds) != dim_x:
+        msg = f'Bounds have incorrect length {len(bounds)} != {dim_x=}'
+        raise ValueError(msg)
+    return dim_x, dim_y
+
+
+def _validate_labels(cls) -> tuple[list[str], list[str]]:
+    """Return (labels_x, labels_y) as lists consistent with ``cls.dim_x`` / ``cls.dim_y``.
+
+    ``cls`` is any object exposing labels_x, labels_y, dim_x and dim_y.  A list of labels
+    must match the dimension (ValueError otherwise); a single string label is expanded
+    to ``label_1 .. label_n`` when the dimension exceeds one, else wrapped in a list.
+    """
+
+    def compute_labels(dim, labels):
+        if isinstance(labels, list):
+            if dim is not None and dim != len(labels):
+                msg = f'Labels {labels} are not consistent with data dimension {dim=}'
+                raise ValueError(msg)
+            return labels
+        if dim is not None and dim > 1:
+            # give each parameter a unique label by appending a number
+            return [f'{labels}_{i + 1}' for i in range(dim)]
+        # unknown or single dimension: normalize to a single element list
+        return [labels]
+
+    labels_x = compute_labels(cls.dim_x, cls.labels_x)
+    return labels_x, compute_labels(cls.dim_y, cls.labels_y)
+
 
 class _DialWorkflowCreationParams(BaseModel):
     """This comprises the information needed to create a DIAL workflow.
 
-    This is a base class which should not be directly imported, clients should use "DialWorkflowCreationParamsClient" (in this file) and services should use "DialWorkflowCreationParamsService" (exported from the service)
+    This is a base class which should not be directly imported, clients should use
+    "DialWorkflowCreationParamsClient" (in this file) and services should use
+    "DialWorkflowCreationParamsService" (exported from the service)
     """
 
     dataset_x: Annotated[
@@ -27,22 +165,75 @@ class _DialWorkflowCreationParams(BaseModel):
         Field(description='The input vectors of the training data'),
     ]
     dataset_y: Annotated[
-        list[float],
+        list[
+            float
+            | Annotated[
+                list[float],
+                Field(description='Field lengths of all subarrays should be equal'),
+            ]
+        ],
+        Field(
+            description=('The output values of the training data. Length should equal dataset_x'),
+        ),
+    ]
+    labels_x: Annotated[
+        Label | list[Label],
+        Field(default='x', description='Labels for input variables x.'),
+    ]
+    labels_y: Annotated[
+        Label | list[Label],
+        Field(default='y', description='Labels for output variables y.'),
+    ]
+    dim_x: Annotated[
+        PositiveIntType | None,
         Field(
-            description='The output values of the training data. Length should equal dataset_x',
+            default=None,
+            description=(
+                'Provide the dimension of entries in dataset_x explicitly,'
+                ' e.g. if the initial dataset is empty.'
+                ' If None, it will be inferred from dataset_x if possible.'
+            ),
         ),
     ]
+    dim_y: Annotated[
+        PositiveIntType | None,
+        Field(
+            default=1,
+            description=(
+                'Provide the dimension of entries in dataset_y explicitly,'
+                ' e.g. if the initial dataset is empty.'
+                ' If None, it will be inferred from dataset_y if possible.'
+            ),
+        ),
+    ]
+    statistics_y: Annotated[
+        Distribution,
+        Field(
+            default=Delta(loc='y'),
+            description=(
+                'Provide the statistical model underlying the y data: For example:'
+                " Delta(loc='y') means that the y data is without error,"
+                " Normal(loc='y', scale=0.1) is a standard error with mean y and standard deviation 0.1"
+                " Normal(loc='y', scale='yerr') takes the std.dev. from the data column yerr."
+            ),
+        ),
+    ]
+
     y_is_good: Annotated[
         bool,
         Field(
-            default=True,  # <-- Set default here
-            description='If true, treat higher y values as better (e.g. y represents yield or profit).  If false, opposite (e.g. y represents error or waste)',
+            default=True,
+            description=(
+                'If true, treat higher y values as better'
+                ' (e.g. y represents yield or profit).'
+                ' If false, opposite (e.g. y represents error or waste)'
+            ),
         ),
     ]
     kernel: Literal['rbf', 'matern', 'linear']
     bounds: list[
         Annotated[
-            Annotated[list[float], Field(min_length=2, max_length=2)],
+            list[float],
             Field(min_length=2, max_length=2),
         ]
     ]
@@ -55,7 +246,6 @@ class _DialWorkflowCreationParams(BaseModel):
             description='Specific RNG seed - use -1 to use system default',
         ),
     ]
-    dim_x: Annotated[int, Field(default=1)]
 
     preprocess_log: bool = Field(default=False)
     preprocess_standardize: bool = Field(default=False)
@@ -73,26 +263,31 @@ class _DialWorkflowCreationParams(BaseModel):
     )
     """Miscellaneous additional arguments."""
 
-    @field_validator('dataset_x')
+    @field_validator('dataset_x', 'dataset_y')
     @classmethod
-    def ensure_consistent_dataset_x_lengths(cls, x):
-        if len(x) < 2:
-            return x
-        target_length = len(x[0])
-        for row in x[1:]:
-            if len(row) != target_length:
-                msg = 'Unequal vector lengths in dataset_x'
-                raise ValueError(msg)
-        return x
+    def ensure_consistent_dataset_lengths(cls, dataset, info: ValidationInfo):
+        is_valid = _validate_dataset_lengths(dataset)
+        if not is_valid:
+            msg = f'Unequal vector lengths in {info.field_name}'
+            raise ValueError(msg)
+        return dataset
 
     # order rows as [low, high] - do NOT error out here, we can efficiently handle normalization
-    @field_validator('bounds')
+    @field_validator('bounds', mode='after')
     @classmethod
     def order_bounds(cls, bounds: list[list[float]]):
         for row in bounds:
             row.sort()
         return bounds
 
+    @model_validator(mode='after')
+    def validate_dims_and_length(self):
+        # compute the dimensions and validate consistency
+        self.dim_x, self.dim_y = _validate_dims_and_length(vars(self), 'dataset_x', 'dataset_y')
+        # compute or validate labels
+        self.labels_x, self.labels_y = _validate_labels(self)
+        return self
+
 
 # this class is specific to clients; they have no way of knowing which backends the Service supports, so we allow all of them
 class DialWorkflowCreationParamsClient(_DialWorkflowCreationParams):
@@ -102,6 +297,8 @@ class DialWorkflowCreationParamsClient(_DialWorkflowCreationParams):
 
 
 class DialWorkflowDatasetUpdate(BaseModel):
+    """This class is used to send a single update to the dataset."""
+
     workflow_id: ValidatedObjectId
     next_x: list[float] = Field(
         description='The next collection of X values you want to append to your overall data',
@@ -125,6 +322,8 @@ class DialWorkflowDatasetUpdate(BaseModel):
 
 
 class DialWorkflowDatasetUpdates(BaseModel):
+    """This class is used to send multiple updates to the dataset."""
+
     workflow_id: ValidatedObjectId
     next_x_list: list[list[float]] = Field(min_length=1)
     next_y_list: list[float] = Field(min_length=1)
@@ -132,30 +331,63 @@ class DialWorkflowDatasetUpdates(BaseModel):
     backend_args: dict[str, float | int | bool | str | list[float] | tuple] | None = None
     extra_args: dict[str, float | int | bool | str | list[float] | tuple] | None = None
 
+    @field_validator('next_x_list', 'next_y_list')
+    @classmethod
+    def ensure_consistent_dataset_x_lengths(cls, dataset, ctx):
+        is_valid = _validate_dataset_lengths(dataset)
+        if not is_valid:
+            msg = f'Unequal vector lengths in {ctx.field_name}'
+            raise ValueError(msg)
+        return dataset
+
+    @model_validator(mode='after')
+    def validate_dims_and_length(self):
+        _validate_dims_and_length(vars(self), 'next_x_list', 'next_y_list')
+        return self
+
 
 class DialInputSingleConfidenceBound(BaseModel):
+    """This class is used to request a single next point using the confidence_bound strategy."""
+
     workflow_id: ValidatedObjectId
     strategy: Literal['confidence_bound']
     strategy_args: dict[str, float | int | bool] | None = Field(default=None)
     y_is_good: Annotated[
-        bool,
+        bool | None,
         Field(
-            default=True,  # <-- Set default here
-            description='If true, treat higher y values as better (e.g. y represents yield or profit).  If false, opposite (e.g. y represents error or waste)',
+            default=None,
+            description=(
+                'If true, treat higher y values as better (e.g. y represents yield or profit).'
+                ' If false, opposite (e.g. y represents error or waste).'
+                ' If None, the value from DialWorkflowCreationParams is used.'
+            ),
         ),
     ]
-    bounds: list[
-        Annotated[
-            Annotated[list[float], Field(min_length=2, max_length=2)],
-            Field(min_length=2, max_length=2),
-        ]
+    bounds: Annotated[
+        None
+        | list[
+            Annotated[
+                Annotated[list[float], Field(min_length=2, max_length=2)],
+                Field(min_length=2, max_length=2),
+            ]
+        ],
+        Field(default=None),
+    ]
+    seed: Annotated[
+        int,
+        Field(
+            default=-1,
+            ge=-1,
+            le=4294967295,
+            description='Specific RNG seed - use -1 to use system default',
+        ),
     ]
     extra_args: dict[str, float | int | bool | str | list[float] | tuple] | None = Field(
         default=None
     )
     """These extra arguments will be MERGED with the saved extra_args, with these arguments taking place over the saved values when applicable."""
     optimization_points: PositiveIntType = Field(default=1000)
-    confidence_bound: float = Field(gt=0.5, lt=1)
+    confidence_bound: float = Field(gt=0.5, lt=1.0)
     discrete_measurements: bool = Field(default=False)
     discrete_measurement_grid_size: list[PositiveIntType] = Field(default=[20, 20])
     point_index: Annotated[
@@ -168,6 +400,8 @@ class DialInputSingleConfidenceBound(BaseModel):
 
 
 class DialInputSingleOtherStrategy(BaseModel):
+    """This class is used to request a single next point using a given strategy."""
+
     workflow_id: ValidatedObjectId
     strategy: Literal[
         'random',
@@ -180,17 +414,25 @@ class DialInputSingleOtherStrategy(BaseModel):
     ]
     strategy_args: dict[str, float | int | bool] | None = Field(default=None)
     y_is_good: Annotated[
-        bool,
+        bool | None,
         Field(
-            default=True,  # <-- Set default here
-            description='If true, treat higher y values as better (e.g. y represents yield or profit).  If false, opposite (e.g. y represents error or waste)',
+            default=None,
+            description=(
+                'If true, treat higher y values as better (e.g. y represents yield or profit).'
+                ' If false, opposite (e.g. y represents error or waste).'
+                ' If None, the value from DialWorkflowCreationParams is used.'
+            ),
         ),
     ]
-    bounds: list[
-        Annotated[
-            Annotated[list[float], Field(min_length=2, max_length=2)],
-            Field(min_length=2, max_length=2),
-        ]
+    bounds: Annotated[
+        None
+        | list[
+            Annotated[
+                Annotated[list[float], Field(min_length=2, max_length=2)],
+                Field(min_length=2, max_length=2),
+            ]
+        ],
+        Field(default=None),
     ]
     seed: Annotated[
         int,
@@ -227,6 +469,8 @@ class DialInputSingleOtherStrategy(BaseModel):
 
 
 class DialInputMultipleOtherStrategy(BaseModel):
+    """This class is used to request multiple next points (as many as given by `points`) using a given strategy."""
+
     workflow_id: ValidatedObjectId
     points: PositiveIntType
     strategy: Literal[
@@ -240,17 +484,25 @@ class DialInputMultipleOtherStrategy(BaseModel):
     ]
     strategy_args: dict[str, float | int | bool] | None = Field(default=None)
     y_is_good: Annotated[
-        bool,
+        bool | None,
         Field(
-            default=True,  # <-- Set default here
-            description='If true, treat higher y values as better (e.g. y represents yield or profit).  If false, opposite (e.g. y represents error or waste)',
+            default=None,
+            description=(
+                'If true, treat higher y values as better (e.g. y represents yield or profit).'
+                ' If false, opposite (e.g. y represents error or waste).'
+                ' If None, the value from DialWorkflowCreationParams is used.'
+            ),
         ),
     ]
-    bounds: list[
-        Annotated[
-            Annotated[list[float], Field(min_length=2, max_length=2)],
-            Field(min_length=2, max_length=2),
-        ]
+    bounds: Annotated[
+        None
+        | list[
+            Annotated[
+                Annotated[list[float], Field(min_length=2, max_length=2)],
+                Field(min_length=2, max_length=2),
+            ]
+        ],
+        Field(default=None),
     ]
     seed: Annotated[
         int,
@@ -280,6 +532,7 @@ class DialInputPredictions(BaseModel):
     """This is the input dataclass for Dial for requesting a surrogate evaluation at a given number of points."""
 
     workflow_id: ValidatedObjectId
+
     points_to_predict: list[list[float]]
     extra_args: dict[str, float | int | bool | str | list[float] | tuple] | None = Field(
         default=None
diff --git a/src/dial_dataclass/dial_dataclass_responses.py b/src/dial_dataclass/dial_dataclass_responses.py
index b7cc4f8..cfcd806 100644
--- a/src/dial_dataclass/dial_dataclass_responses.py
+++ b/src/dial_dataclass/dial_dataclass_responses.py
@@ -43,10 +43,8 @@ class DialSurrogateValuesResponse(BaseModel):
 
     values: list[float]
     """The computed values (for example, from Gaussian backends, the means) from calling get_surrogate_values()"""
-    transformed_stddevs: list[float]
-    """The computed uncertainties from calling get_surrogate_values(), with an inverse transform. If inverse-transforming is not possible (due to log-preprocessing), this will be all -1"""
-    stddevs: list[float]  # TODO will probably remove in future
-    """The computed raw uncertainties from calling get_surrogate_values(), without an inverse transform"""
+    stddevs: list[float]
+    """The computed uncertainties from calling get_surrogate_values(), with an inverse transform."""
     dim_x: int
     """Number of dimensions of the associated data, derived from workflow"""
     bounds: list[list[float]]
@@ -57,5 +55,5 @@ class DialSurrogateValuesResponse(BaseModel):
     """The same workflow ID that was used to get the data, to facilitate possible load balancing."""
     dataset_x_size: int
     """Current length of dataset_x"""
-    transformed_stddevs_avg: float
-    """the average of the transformed stddevs being returned"""
+    stddevs_avg: float
+    """The average of the transformed stddevs being returned"""
diff --git a/src/dial_service/backends/gpax_backend.py b/src/dial_service/backends/gpax_backend.py
index ee0b064..0b45bba 100644
--- a/src/dial_service/backends/gpax_backend.py
+++ b/src/dial_service/backends/gpax_backend.py
@@ -14,9 +14,7 @@ class GpaxBackend(AbstractBackend[gpax.viGP, str, tuple[jnp.ndarray, jnp.ndarray
     @staticmethod
     def train_model(data):
         """Generate a trained model."""
-        rng_key_train, rng_key_predict = gpax.utils.get_keys(
-            seed=data.seed if data.seed != -1 else None
-        )
+        rng_key_train, _ = gpax.utils.get_keys(seed=data.seed if data.seed != -1 else None)
         gp_model = gpax.viGP(len(data.bounds), GpaxBackend.get_kernel(data), guide='delta')
         gp_model.fit(
             rng_key_train,
@@ -32,21 +30,17 @@ def train_model(data):
     @staticmethod
     def initialize_model(data):
         """Generate an untrained model."""
-        rng_key_train, rng_key_predict = gpax.utils.get_keys(
-            seed=data.seed if data.seed != -1 else None
-        )
         return gpax.viGP(len(data.bounds), GpaxBackend.get_kernel(data), guide='delta')
 
     @staticmethod
     def predict(model, data):
-        rng_key_train, rng_key_predict = gpax.utils.get_keys(
-            seed=data.seed if data.seed != -1 else None
-        )
+        _, rng_key_predict = gpax.utils.get_keys(seed=data.seed if data.seed != -1 else None)
         x = data.x_predict
         # mean, y_var = model.predict(rng_key_predict, data.x_predict)
         # TODO check why model.predict().reshape() fails
         mean, y_var = model.predict(rng_key_predict, x.reshape(1, -1))
-        return mean[0], data.stddev * y_var[0]
+        # return the square root of the variance (the standard deviation)
+        return mean[0], jnp.sqrt(y_var[0])
 
     @staticmethod
     def get_kernel(data):
diff --git a/src/dial_service/backends/sable_backend.py b/src/dial_service/backends/sable_backend.py
index b53e283..ba637b5 100644
--- a/src/dial_service/backends/sable_backend.py
+++ b/src/dial_service/backends/sable_backend.py
@@ -30,17 +30,20 @@ def _get_model_kwargs(data) -> dict:
 
 def _get_observation_errors(data, n_observations: int) -> np.ndarray:
     backend_args = {} if data.backend_args is None else data.backend_args
-    y_err = backend_args.get('y_err', backend_args.get('noise_level', 1e-6))
-    # TODO figure this out: We need a consistent way to configure alpha / noise_level / y_err
 
-    y_err_arr = np.asarray(y_err, dtype=float).reshape(-1)
-    if y_err_arr.size == 1:
-        y_err_arr = np.full(n_observations, float(y_err_arr[0]), dtype=float)
-
-    if data.preprocess_standardize and len(data.Y_raw) > 0:
-        scale = np.std(np.asarray(data.Y_raw, dtype=float))
-        if scale > 0:
-            y_err_arr = y_err_arr / scale
+    if data.statistics_y.name == 'Normal':
+        y_err = data.Yerr_train
+        y_err_arr = np.asarray(y_err, dtype=float).reshape(-1)
+        if y_err_arr.size == 1:
+            y_err_arr = np.full(n_observations, float(y_err_arr[0]), dtype=float)
+    else:
+        # if y_err is not provided through the statistics, use the old fallback for compatibility
+        # TODO: remove if no longer needed
+        y_err = backend_args.get('y_err', backend_args.get('noise_level', 1e-6))
+
+        y_err_arr = np.asarray(y_err, dtype=float).reshape(-1)
+        if y_err_arr.size == 1:
+            y_err_arr = np.full(n_observations, float(y_err_arr[0]), dtype=float)
 
     return y_err_arr
 
diff --git a/src/dial_service/backends/sklearn_backend.py b/src/dial_service/backends/sklearn_backend.py
index e70cde7..2d649fe 100644
--- a/src/dial_service/backends/sklearn_backend.py
+++ b/src/dial_service/backends/sklearn_backend.py
@@ -33,7 +33,8 @@ def _filter_kwargs_for(cls, params: dict) -> dict:
     """Keep only kwargs that `cls.__init__` actually accepts."""
     sig = inspect.signature(cls.__init__)
     allowed = set(sig.parameters) - {'self', 'args', 'kwargs'}
-    return {k: v for k, v in params.items() if k in allowed}
+    params_filtered = {k: v for k, v in params.items() if k in allowed}
+    return params_filtered
 
 
 class SklearnBackend(
@@ -45,70 +46,86 @@ def get_kernel(data):
         if kernel_name not in _KERNELS_SKLEARN:
             msg = f'Unknown kernel {kernel_name}'
             raise ValueError(msg)
-        _params = {} if data.kernel_args is None else data.kernel_args
 
+        _params = {} if data.kernel_args is None else data.kernel_args.copy()
+
+        # if length_scale is not provided, configure a default learnable length_scale
+        # (one entry per dimension if extra_args['length_per_dimension'] is set, else a scalar)
         if 'length_scale' not in _params:
             length_per_dimension = (
                 data.extra_args.get('length_per_dimension') if data.extra_args else False
             )
-            # TODO check if necessary
-            # dim = data.X_train.shape[1]
-            # _params['length_scale'] = [1.0] * dim if length_per_dimension else 1.0
             _params['length_scale'] = [1.0] * data.dim_x if length_per_dimension else 1.0
+            _params['length_scale_bounds'] = (1e-05, 100000.0)
 
         base_kernel_cls = _KERNELS_SKLEARN[kernel_name]
         base_params = _filter_kwargs_for(base_kernel_cls, _params)
 
-        # Only do hyperparameter optimization if the user asks for it
-        # TODO make the default parameters for the kernels different from the sklearn defaults, but allow the user to customize it
-        const_params = {'constant_value_bounds': 'fixed', 'constant_value': 1.0}
-        const_params.update(_filter_kwargs_for(ConstantKernel, _params))
-        white_params = {'noise_level_bounds': 'fixed', 'noise_level': 1e-6}
-        white_params.update(_filter_kwargs_for(WhiteKernel, _params))
-
+        # only do hyperparameter optimization if the user asks for it, use fixed defaults
         if base_kernel_cls == DotProduct:
-            base_params = {'sigma_0': 1.0, 'sigma_0_bounds': 'fixed'}
+            base_params = {'sigma_0': 1.0, 'sigma_0_bounds': 'fixed'} | base_params
         else:
-            base_params = {'length_scale': 1.0, 'length_scale_bounds': 'fixed'}
-        base_params.update(_filter_kwargs_for(base_kernel_cls, _params))
-
-        constant_kernel = ConstantKernel(**const_params)
+            base_params = {'length_scale': 1.0, 'length_scale_bounds': 'fixed'} | base_params
         base_kernel = base_kernel_cls(**base_params)
-        white_kernel = WhiteKernel(**white_params)
 
-        return constant_kernel * base_kernel + white_kernel
+        # scale the prior variance by using a ConstantKernel
+        const_params = _filter_kwargs_for(ConstantKernel, _params)
+        if const_params:
+            # use a fixed value by default, unless bounds are explicitly provided
+            const_params = {'constant_value': 1.0, 'constant_value_bounds': 'fixed'} | const_params
+            constant_kernel = ConstantKernel(**const_params)
+            kernel = constant_kernel * base_kernel
+        else:
+            kernel = base_kernel
+
+        # if requested, add a WhiteKernel with variance noise_level
+        white_params = _filter_kwargs_for(WhiteKernel, _params)
+        if white_params:
+            # use a fixed value by default, unless bounds are explicitly provided
+            white_params = {'noise_level': 1e-12, 'noise_level_bounds': 'fixed'} | white_params
+            white_kernel = WhiteKernel(**white_params)
+            kernel = kernel + white_kernel
+
+        return kernel
 
     @staticmethod
     def train_model(data):
         """Create a model with training."""
-        if data.backend_args is None:
-            _extra_args = {}
-        else:
-            _extra_args = data.backend_args.copy()  # Ensure it's a dictionary
-            if 'alpha' in _extra_args and not isinstance(_extra_args['alpha'], np.ndarray):
-                # Process alpha as a numpy array
-                _extra_args['alpha'] = np.array(_extra_args['alpha'])
-        # print(_extra_args['alpha'])
-        model = GaussianProcessRegressor(
-            kernel=SklearnBackend.get_kernel(data), n_restarts_optimizer=1000, **_extra_args
-        )
+        model = SklearnBackend.initialize_model(data)
+
+        # print(f'pre-training kernel: {SklearnBackend.get_kernel(data)}')
         model.fit(data.X_train, data.Y_train)
+        # print(f'obtained trained kernel: {model.kernel_}')
+
         return model
 
     @staticmethod
     def initialize_model(data):
         """Create a model without training."""
-        if data.backend_args is None:
-            _extra_args = {}
-        else:
-            _extra_args = data.backend_args.copy()  # Ensure it's a dictionary
-            if 'alpha' in _extra_args and not isinstance(_extra_args['alpha'], np.ndarray):
+        kernel = SklearnBackend.get_kernel(data)
+
+        # if the output statistics are a normal distribution, configure the alpha argument for sklearn
+        _statistics_args = {}
+        if data.statistics_y.name == 'Normal':
+            # set alpha to the variance associated to Y_err_train
+            y_variance_train = data.Yerr_train**2
+            _statistics_args['alpha'] = y_variance_train
+
+        _extra_args = {}
+        if data.backend_args is not None:
+            # copy backend_args
+            _extra_args = data.backend_args.copy()
+
+            # backwards compatible way to set alpha
+            if 'alpha' in _extra_args:
                 # Process alpha as a numpy array
-                _extra_args['alpha'] = np.array(_extra_args['alpha'])
+                _extra_args['alpha'] = np.asarray(_extra_args['alpha'])
+
+        # update alpha from statistics_args, if present
+        # TODO: should raise a warning, if already present, or if WhiteKernel is present
+        _extra_args.update(_statistics_args)
 
-        return GaussianProcessRegressor(
-            kernel=SklearnBackend.get_kernel(data), n_restarts_optimizer=1000, **_extra_args
-        )
+        return GaussianProcessRegressor(kernel=kernel, n_restarts_optimizer=1000, **_extra_args)
 
     @staticmethod
     def predict(model, data):
diff --git a/src/dial_service/core.py b/src/dial_service/core.py
index 61f52ba..d7b616d 100644
--- a/src/dial_service/core.py
+++ b/src/dial_service/core.py
@@ -102,21 +102,26 @@ def get_surrogate_values(
     """
     Get surrogate model predictions for given input points.
 
-    Model parameter should be a pretrained model, you can usually call core.train_model with the same data parameter if you don't yet have a model.
+    Model parameter should be a pretrained model,
+    you can usually call core.train_model with the same data parameter if you don't yet have a model.
 
     Args:
         client_data (DialInputPredictions): Input data containing prediction points and model parameters.
 
     Returns:
-        tuple[list[float], list[float], list[float], float]: A tuple containing means, transformed standard deviations, raw standard deviations, and a float value.
+        tuple[list[float], list[float], float]: A tuple containing means, standard deviations,
+              and the root-mean-square average of the standard deviations.
     """
     backend = data.backend.lower()
     module = get_backend_module(backend)
     means, stddevs = module.predict(model, data)
-    means = data.inverse_transform(means)
-    transformed_stddevs = data.inverse_transform(stddevs, is_stddev=True)
-    average = np.sqrt(np.mean(np.asarray(transformed_stddevs) ** 2))
-    return (means.tolist(), transformed_stddevs.tolist(), stddevs.tolist(), float(average))
+    means, stddevs = data.inverse_transform_Y(means, stddevs)
+    average_stddev = np.sqrt(np.mean(np.asarray(stddevs) ** 2))
+    return (
+        means.tolist(),
+        stddevs.tolist(),
+        float(average_stddev),
+    )
 
 
 def train_model(data: ServersideInputBase) -> Any:
diff --git a/src/dial_service/dial_service.py b/src/dial_service/dial_service.py
index db8ea61..bc1a5be 100644
--- a/src/dial_service/dial_service.py
+++ b/src/dial_service/dial_service.py
@@ -93,7 +93,6 @@ def update_workflow_with_data(
     ) -> ValidatedObjectId:
         """Updates the DB with the provided params. Success of operation is based off whether or not the INTERSECT response is an error."""
 
-        # TODO - all exceptions should realistically provide error information to the client. INTERSECT-SDK v0.9 will introduce a specific exception we can throw which will allow us to do this.
         try:
             db_get_result = self.mongo_handler.get_workflow(update_params.workflow_id)
         except Exception:
@@ -239,13 +238,7 @@ def get_next_point(self, client_data: DialInputSingle) -> DialDataResponse1D:
         try:
             model = pickle.loads(workflow_state['model'])  # noqa: S301 (XXX - this is technically trusted data as long as the DB hasn't been modified)
             validated_state = DialWorkflowCreationParamsService(**workflow_state)
-            if client_data.extra_args:
-                if validated_state.extra_args:
-                    validated_state.extra_args.update(client_data.extra_args)
-                else:
-                    validated_state.extra_args = client_data.extra_args
             data = ServersideInputSingle(validated_state, client_data)
-
             return_data = core.get_next_point(data, model)
             return DialDataResponse1D(
                 data=return_data,
@@ -285,13 +278,7 @@ def get_next_points(self, client_data: DialInputMultiple) -> DialDataResponse2D:
         try:
             model = pickle.loads(workflow_state['model'])  # noqa: S301 (XXX - this is technically trusted data as long as the DB hasn't been modified)
             validated_state = DialWorkflowCreationParamsService(**workflow_state)
-            if client_data.extra_args:
-                if validated_state.extra_args:
-                    validated_state.extra_args.update(client_data.extra_args)
-                else:
-                    validated_state.extra_args = client_data.extra_args
             data = ServersideInputMultiple(validated_state, client_data)
-
             return_data = core.get_next_points(data, model)
             return DialDataResponse2D(
                 data=return_data,
@@ -309,10 +296,11 @@ def get_next_points(self, client_data: DialInputMultiple) -> DialDataResponse2D:
     def get_surrogate_values(
         self, client_data: DialInputPredictions
     ) -> DialSurrogateValuesResponse:
-        """Trains a model then returns 3 lists based on user-supplied points:
-        - Predicted values.  These are inverse transformed (undoing the preprocessing to put them on the same scale as dataset_y)
-        - Inverse-transformed uncertainties.  If inverse-transforming is not possible (due to log-preprocessing), this will be all -1
-        - Uncertainties without inverse transformation
+        """Trains a model then returns two lists based on user-supplied points:
+        - Predicted values.
+          These are inverse transformed (undoing the preprocessing to put them on the same scale as dataset_y)
+        - Uncertainties.
+          These are inverse transformed standard errors, transformed according to the differential of the transform.
 
         Additional metadata is also returned in the response.
         """
@@ -340,17 +328,16 @@ def get_surrogate_values(
                     validated_state.extra_args = client_data.extra_args
             data = ServersideInputPrediction(validated_state, client_data)
 
-            return_data = core.get_surrogate_values(data, model)
+            means, stddevs, average_stddev = core.get_surrogate_values(data, model)
             return DialSurrogateValuesResponse(
-                values=return_data[0],
-                transformed_stddevs=return_data[1],
-                stddevs=return_data[2],
+                values=means,
+                stddevs=stddevs,
                 dim_x=validated_state.dim_x,
                 points_to_predict=client_data.points_to_predict,
                 bounds=validated_state.bounds,
                 workflow_id=client_data.workflow_id,
                 dataset_x_size=len(validated_state.dataset_x),
-                transformed_stddevs_avg=return_data[3],
+                stddevs_avg=average_stddev,
             )
         except Exception as err:
             logger.exception(
diff --git a/src/dial_service/serverside_data.py b/src/dial_service/serverside_data.py
index 78f0541..0602da2 100644
--- a/src/dial_service/serverside_data.py
+++ b/src/dial_service/serverside_data.py
@@ -14,8 +14,13 @@
 # this is an extended version of ActiveLearningInputData.  This allows us to add on properties and methods to this class without impacting the client side
 class ServersideInputBase:
     def __init__(self, data: DialWorkflowCreationParamsService):
-        self.X_raw = np.array(data.dataset_x)
-        self.Y_raw = np.array(data.dataset_y)
+        self.dim_x = data.dim_x
+        self.dim_y = data.dim_y
+        self.labels_x = data.labels_x
+        self.labels_y = data.labels_y
+        self.dataset_x = np.array(data.dataset_x)
+        self.dataset_y = np.array(data.dataset_y).reshape((-1, self.dim_y))
+        self.statistics_y = data.statistics_y
         # it seems like there should be a smarter way to do this, but stuff involving loops doesn't work with static autocompleters:
         self.bounds = data.bounds
         self.y_is_good = data.y_is_good
@@ -28,26 +33,18 @@ def __init__(self, data: DialWorkflowCreationParamsService):
         self.backend_args = data.backend_args
         self.kernel_args = data.kernel_args
         self.extra_args = data.extra_args
-        self.dim_x = data.dim_x
 
     @cached_property
-    def stddev(self) -> float:
-        return np.std(self.Y_train)
-
-    @cached_property
-    def Y_best(self) -> float:
-        return self.Y_train.max() if self.y_is_good else self.Y_train.min()
+    def X_train(self) -> np.ndarray:
+        """
+        Return X scaled to [0, 1] per dimension based on self.bounds.
 
-    @cached_property
-    def Y_train(self) -> np.ndarray:
-        y = self.Y_raw
-        if self.preprocess_log:
-            y = np.log(y)
-        if self.preprocess_standardize:
-            y = (y - np.mean(y)) / np.std(y)
-        return y
+        dataset_x: list[list[float]], shape (N, D)
+        bounds: list[[low, high], ...], shape (D, 2)
+        """
+        return self.scale_X(self.dataset_x)
 
-    def _scale_X(self, X: np.ndarray) -> np.ndarray:
+    def scale_X(self, X: np.ndarray) -> np.ndarray:
         """
         Scale X into [0, 1]^D using self.bounds.
         X: array of shape (N, D)
@@ -65,33 +62,120 @@ def _scale_X(self, X: np.ndarray) -> np.ndarray:
 
         return (X - lows) / span
 
+    def _extract_y_train_from_dataset(self):
+        """
+        Find output y and error values yerr in dataset_y, validate yerr >= 0, and save.
+        """
+        if hasattr(self, 'y_train_raw') and hasattr(self, 'yerr_train_raw'):
+            # only compute this on first invocation
+            return
+
+        y_label = self.statistics_y.loc
+        if not isinstance(y_label, str):
+            msg = 'statistics_y.loc must be a Label (str).'
+            raise TypeError(msg)
+
+        # Use the label from self.statistics_y.loc to find the data column with the mean y data
+        # this may trigger a ValueError, if the label does not exist, but should be handled by dataclass validation
+        y = self.dataset_y[:, self.labels_y.index(y_label)]
+
+        yerr_label = self.statistics_y.scale
+        if isinstance(yerr_label, float):
+            yerr = yerr_label
+        else:
+            # yerr_label is str; the lookup may trigger a ValueError as above
+            yerr = self.dataset_y[:, self.labels_y.index(yerr_label)]
+
+        # validate before caching, so a failed call is not mistaken for a completed one on retry
+        negative = np.flatnonzero(np.atleast_1d(yerr) < 0)
+        if negative.size > 0:
+            msg = f'yerr values in statistics_y.scale must be non-negative, found {np.atleast_1d(yerr)[negative]} at {negative}.'
+            raise ValueError(msg)
+
+        self.y_train_raw, self.yerr_train_raw = y, yerr
+
     @cached_property
-    def X_train(self) -> np.ndarray:
+    def Y_train(self) -> np.ndarray:
         """
-        Return X scaled to [0, 1] per dimension based on self.bounds.
+        Find output y and error values yerr in dataset_y, and apply transformation.
+        Return transformed y value.
+        """
+        # ensure that self.y_train_raw, self.yerr_train_raw are populated
+        self._extract_y_train_from_dataset()
 
-        dataset_x: list[list[float]], shape (N, D)
-        bounds: list[[low, high], ...], shape (D, 2)
+        y, _ = self.transform_Y(self.y_train_raw, self.yerr_train_raw)
+
+        # return only y, to conform to interface
+        return y
+
+    @cached_property
+    def Yerr_train(self) -> 'np.ndarray | float':
+        """
+        Find output y and error values in dataset y, and apply transformation.
+        Return transformed yerr value.
         """
-        return self._scale_X(self.X_raw)
+        # ensure that self.y_train_raw, self.yerr_train_raw are populated
+        self._extract_y_train_from_dataset()
+
+        # recompute transformation, at some overhead (probably not worth to optimize)
+        _, yerr = self.transform_Y(self.y_train_raw, self.yerr_train_raw)
 
-    # undoes the preprocessing.
-    def inverse_transform(self, data: np.ndarray, is_stddev: bool = False):
-        if len(self.Y_raw) == 0:
-            return data
+        # return only yerr, to conform to interface
+        return yerr
 
-        # not possible to un-log the standard deviations (-1 +- 1 in log space != .1 +- 10 in realspace)
-        if self.preprocess_log and is_stddev:
-            return np.repeat(-1, len(data))
+    def _transform_Y_params(self) -> tuple[float, float]:
+        """
+        Return the (mean, std) of the raw y data used for standardization.
+        """
+        # ensure that self.y_train_raw, self.yerr_train_raw are populated
+        self._extract_y_train_from_dataset()
+
+        y_train = self.y_train_raw
+        if len(y_train) > 0 and self.preprocess_standardize:
+            if self.preprocess_log:
+                y_train = np.log(y_train)
+            y_mean = np.mean(y_train)
+            # zero spread (single point / constant y): use unit scale to avoid dividing by zero
+            y_std = np.std(y_train) or 1.0
+        else:
+            y_mean = 0.0
+            y_std = 1.0
+
+        return y_mean, y_std
+
+    def transform_Y(
+        self, y: np.ndarray, yerr: 'np.ndarray | float'
+    ) -> 'tuple[np.ndarray, np.ndarray | float]':
+        """Transform y and yerr: optional log, then optional standardization."""
+        if self.preprocess_log:
+            # first-order error propagation d(log y) = dy / y; needs y before the log is taken
+            yerr = yerr / y
+            y = np.log(y)
+        if self.preprocess_standardize:
+            y_mean, y_std = self._transform_Y_params()
+            yerr = yerr / y_std
+            y = (y - y_mean) / y_std
+
+        return y, yerr
+
+    def inverse_transform_Y(
+        self, y: np.ndarray, yerr: 'np.ndarray | float'
+    ) -> 'tuple[np.ndarray, np.ndarray | float]':
+        """Inverse transforms of y and yerr, applied in reverse order of transform_Y."""
         if self.preprocess_standardize:
-            # the data that was used to calculate the standardization:
-            prestandardized_y = np.log(self.Y_raw) if self.preprocess_log else self.Y_raw
-            data = data * np.std(prestandardized_y)  # not the same as *= (which is in-place)
-            if not is_stddev:
-                data = data + np.mean(prestandardized_y)
+            y_mean, y_std = self._transform_Y_params()
+            y = y_mean + y_std * y
+            yerr = y_std * yerr
+
         if self.preprocess_log:
-            data = np.exp(data)
-        return data
+            y = np.exp(y)
+            yerr = y * yerr
+
+        return y, yerr
+
+    @cached_property
+    def Y_best(self) -> float:
+        return self.Y_train.max() if self.y_is_good else self.Y_train.min()
 
 
 class ServersideInputSingle(ServersideInputBase):
@@ -101,27 +185,42 @@ def __init__(
         params: DialInputSingle,
     ):
         super().__init__(workflow_state)
+        # set new inputs
         self.strategy = params.strategy
         self.strategy_args = params.strategy_args
-        self.y_is_good = params.y_is_good
-        self.bounds = params.bounds
-        self.numpy_rng = np.random.RandomState(None if params.seed == -1 else params.seed)
-
         self.optimization_points = params.optimization_points
         self.confidence_bound = (
             params.confidence_bound if params.strategy == 'confidence_bound' else 0.0
         )
+        # if params.strategy == 'confidence_bound':
+        #    self.confidence_bound = params.confidence_bound
+        # elif self.strategy_args is not None and 'confidence_bounds' in self.strategy_args:
+        #    self.confidence_bound = params.strategy_args['confidence_bound']
         self.discrete_measurements = params.discrete_measurements
         self.discrete_measurement_grid_size = params.discrete_measurement_grid_size
         self.point_index = params.point_index
 
+        # update values from workflow initialization, if provided
+        if params.extra_args is not None:
+            if self.extra_args is not None:
+                self.extra_args.update(params.extra_args)
+            else:
+                self.extra_args = params.extra_args
+        if params.y_is_good is not None:
+            self.y_is_good = params.y_is_good
+        if params.bounds is not None:
+            self.bounds = params.bounds
+
+        # always reinit rng, since initial rng is not updated in db!
+        self.numpy_rng = np.random.RandomState(None if params.seed == -1 else params.seed)
+
     def set_x_predict(self, X_raw: np.ndarray) -> None:
         """
         Store raw prediction points and their scaled version.
         X_raw: shape (N, D) or (D,) for a single point.
         """
         raw_vals = np.asarray(X_raw, dtype=float).reshape(-1, self.dim_x)
-        self.x_predict = self._scale_X(raw_vals)
+        self.x_predict = self.scale_X(raw_vals)
 
 
 class ServersideInputMultiple(ServersideInputBase):
@@ -130,15 +229,12 @@ def __init__(
         workflow_state: DialWorkflowCreationParamsService,
         params: DialInputMultiple,
     ):
+        # set new inputs
         super().__init__(workflow_state)
         self.strategy = params.strategy
         self.points = params.points
         self.strategy = params.strategy
         self.strategy_args = params.strategy_args
-        self.y_is_good = params.y_is_good
-        self.bounds = params.bounds
-        self.numpy_rng = np.random.RandomState(None if params.seed == -1 else params.seed)
-
         self.optimization_points = params.optimization_points
         self.confidence_bound = (
             params.confidence_bound if params.strategy == 'confidence_bound' else 0.0
@@ -146,13 +242,27 @@ def __init__(
         self.discrete_measurements = params.discrete_measurements
         self.discrete_measurement_grid_size = params.discrete_measurement_grid_size
 
+        # update values from workflow initialization, if provided
+        if params.extra_args is not None:
+            if self.extra_args is not None:
+                self.extra_args.update(params.extra_args)
+            else:
+                self.extra_args = params.extra_args
+        if params.y_is_good is not None:
+            self.y_is_good = params.y_is_good
+        if params.bounds is not None:
+            self.bounds = params.bounds
+
+        # always reinit rng, since initial rng is not updated in db!
+        self.numpy_rng = np.random.RandomState(None if params.seed == -1 else params.seed)
+
     def set_x_predict(self, X_raw: np.ndarray) -> None:
         """
         Store raw prediction points and their scaled version.
         X_raw: shape (N, D) or (D,) for a single point.
         """
         raw_vals = np.asarray(X_raw, dtype=float).reshape(-1, self.dim_x)
-        self.x_predict = self._scale_X(raw_vals)
+        self.x_predict = self.scale_X(raw_vals)
 
 
 class ServersideInputPrediction(ServersideInputBase):
@@ -171,4 +281,4 @@ def set_x_predict(self, X_raw: np.ndarray) -> None:
         X_raw: shape (N, D) or (D,) for a single point.
         """
         raw_vals = np.asarray(X_raw, dtype=float).reshape(-1, self.dim_x)
-        self.x_predict = self._scale_X(raw_vals)
+        self.x_predict = self.scale_X(raw_vals)
diff --git a/src/dial_service/utilities/strategies.py b/src/dial_service/utilities/strategies.py
index e0b42be..51d155a 100644
--- a/src/dial_service/utilities/strategies.py
+++ b/src/dial_service/utilities/strategies.py
@@ -16,10 +16,14 @@ def random_in_bounds(bounds: list[list[float]], rng: np.random.RandomState):
 
 
 def uncertainty_sampling(_mean, stddev, _data):
+    """Measure of uncertainty (stddev) for maximization"""
     return stddev
 
 
 def upper_confidence_bound(mean, stddev, data):
+    """Upper confidence bound for maximization
+    If y_is_good = False, multiply mean by -1.
+    """
     _params = data.strategy_args
     y_is_good = data.y_is_good
     _direction = 1 if y_is_good else -1
@@ -31,6 +35,10 @@ def upper_confidence_bound(mean, stddev, data):
 
 
 def upper_confidence_bound_nomad(mean, stddev, data):
+    """Upper confidence bound (NOMAD specific version) for maximization
+    Masks the values around the last measurement point to force exploration.
+    If y_is_good = False, multiply mean by -1.
+    """
     _params = data.strategy_args
     y_is_good = data.y_is_good
     _direction = 1 if y_is_good else -1
@@ -49,20 +57,30 @@ def upper_confidence_bound_nomad(mean, stddev, data):
 
 
 def expected_improvement(mean, stddev, data):
+    """Expected Improvement (EI) for maximization
+    If y_is_good = False, multiply mean and data value by -1.
+    """
     _params = data.strategy_args
     y_is_good = data.y_is_good
+    _direction = 1 if y_is_good else -1
 
-    if stddev < 1e-8:
-        return 0.0
-    z = (mean - data.Y_best) / stddev * (1 if y_is_good else -1)
-    return -stddev * (z * norm.cdf(z) + norm.pdf(z))
+    # guard against small or negative stddev
+    stddev = np.maximum(stddev, 1e-15)
+
+    z = (mean - data.Y_best) / stddev * _direction
+    return stddev * (z * norm.cdf(z) + norm.pdf(z))
 
 
 def confidence_bound(mean, stddev, data):
+    """Confidence bound for maximization
+    The same as upper_confidence_bound with exploit = 1., explore = norm.ppf(0.5 + data.confidence_bound / 2)
+    If y_is_good = False, multiply mean by -1.
+    """
     y_is_good = data.y_is_good
+    _direction = 1 if y_is_good else -1
     z_value = norm.ppf(0.5 + data.confidence_bound / 2)
 
-    return -z_value * stddev + mean * (-1 if y_is_good else 1)
+    return _direction * mean + z_value * stddev
 
 
 STRATEGIES = {
@@ -122,19 +140,18 @@ def to_minimize(_x: np.ndarray):
 
     if data.discrete_measurements:
         _measurement_grid = create_measurement_grid(data)
-        # TODO - commented line is known to fail for expected_improvement regarding discrete measurements
-        # response_surface = to_minimize(_measurement_grid)
-        response_surface = [to_minimize(point) for point in _measurement_grid]
+        response_surface = to_minimize(_measurement_grid)
         index = np.int64(np.argmin(response_surface))
         selected_point = _measurement_grid[index]
         logger.debug('selected point with discrete measurements')
         logger.debug(selected_point)
         return selected_point
 
-    n_restarts = 10
+    n_restarts = 25
     init_array = np.array(hypercube(data.bounds, n_restarts, data.numpy_rng))
     best_score = np.inf
     selected_point = None
+    # out_list = []
     for x_init in init_array:
         res = minimize(
             to_minimize,
@@ -146,6 +163,12 @@ def to_minimize(_x: np.ndarray):
         if res.fun < best_score:
             best_score = res.fun
             selected_point = res.x
+        # out_list.append((x_init.tolist(), res.x.tolist(), res.fun))
+
+    logger.debug('selected point with optimization')
+    logger.debug('score and point: %f, %s', best_score, str(selected_point))
+    # print(f'optimized: {best_score}, {selected_point}:', '\n',
+    #       '\n'.join([str(out) for out in out_list]))
 
     return selected_point.tolist()
 
diff --git a/tests/benchmarks/test_strainmap.py b/tests/benchmarks/test_strainmap.py
index 0b3cd4b..2bca51c 100644
--- a/tests/benchmarks/test_strainmap.py
+++ b/tests/benchmarks/test_strainmap.py
@@ -255,7 +255,7 @@ def run_simulation(
             points_to_predict=INITIAL_POINTS_TO_PREDICT,
         ),
     )
-    surrogate_mean, surrogate_std, _, _ = dial_core.get_surrogate_values(data, model)
+    surrogate_mean, surrogate_std, _ = dial_core.get_surrogate_values(data, model)
     mean_grid = np.array(surrogate_mean).reshape((-1, 1))
 
     # subtract the true values and save mean absolute error and standard deviation
diff --git a/tests/unit/test_internals.py b/tests/unit/test_internals.py
index ca96d21..a84d894 100644
--- a/tests/unit/test_internals.py
+++ b/tests/unit/test_internals.py
@@ -36,8 +36,6 @@ def single_1D(backend, strategy, strategy_args):
         kernel_args={
             'length_scale': 0.5,
             'length_scale_bounds': 'fixed',
-            'noise_level': 0.0,
-            'noise_level_bounds': 'fixed',
             'constant_value': 1.0,
             'constant_value_bounds': 'fixed',
         },
@@ -66,8 +64,6 @@ def single_1D_discrete_grid(backend, strategy, strategy_args, discrete_measureme
         kernel_args={
             'length_scale': 0.5,
             'length_scale_bounds': 'fixed',
-            'noise_level': 0.0,
-            'noise_level_bounds': 'fixed',
             'constant_value': 1.0,
             'constant_value_bounds': 'fixed',
         },
@@ -124,8 +120,6 @@ def single_2D(
         kernel_args={
             'length_scale': 0.15,
             'length_scale_bounds': 'fixed',
-            'noise_level': 0.0,
-            'noise_level_bounds': 'fixed',
             'constant_value': 1.0,
             'constant_value_bounds': 'fixed',
         },
@@ -239,15 +233,12 @@ def single_3D(backend, strategy, strategy_args, discrete_measurement_grid_size=N
         kernel_args={
             'length_scale': 0.15,
             'length_scale_bounds': 'fixed',
-            'noise_level': 0.0,
-            'noise_level_bounds': 'fixed',
             'constant_value': 1.0,
             'constant_value_bounds': 'fixed',
         },
         backend=backend,
         preprocess_standardize=True,
         y_is_good=True,
-        extra_args={'length_per_dimension': True},
         seed=42,
     )
     params = DialInputSingleOtherStrategy(
@@ -266,9 +257,9 @@ def multiple_2D(backend, strategy, discrete_measurement_grid_size=None):
     workflow_state = DialWorkflowCreationParamsService(
         dataset_x=[],
         dataset_y=[],
+        dim_x=2,  # provide dim_x for empty dataset
         y_is_good=False,
         kernel='rbf',
-        length_per_dimension=False,
         bounds=[[0, 100], [-1, 1]],
         backend=backend,
         seed=42,
@@ -293,15 +284,12 @@ def prediction_1D(backend):
         kernel_args={
             'length_scale': 0.5,
             'length_scale_bounds': 'fixed',
-            'noise_level': 0.0,
-            'noise_level_bounds': 'fixed',
             'constant_value': 50.0**2,
             'constant_value_bounds': 'fixed',
         },
         backend=backend,
         preprocess_standardize=False,
         y_is_good=True,
-        extra_args={'length_per_dimension': True},
         seed=42,
     )
     params = DialInputPredictions(
@@ -404,7 +392,7 @@ def test_uncertainty(backend, approx):
 @pytest.mark.parametrize(
     ('backend', 'approx'),
     [
-        ('sklearn', [1.037454]),
+        ('sklearn', [1.790396262]),
         # ('gpax', [2.0]),
     ],
 )
@@ -617,7 +605,7 @@ def test_hypercube_multiple_points(backend):
 
 
 @pytest.mark.parametrize(
-    ('backend', 'expected_means', 'expected_stddevs', 'expected_raw_stddevs'),
+    ('backend', 'expected_means', 'expected_stddevs'),
     [
         (
             'sklearn',
@@ -629,7 +617,6 @@ def test_hypercube_multiple_points(backend):
                 199.99999999,
             ],
             [2.11126987e01, 2.96625069e01, 2.11126987e01],
-            [21.11269870647274, 29.662506906581378, 21.112698706472752],
         ),
         # (
         # 'gpax',
@@ -641,46 +628,54 @@ def test_hypercube_multiple_points(backend):
         #     82.26569221517353,
         # ],
         # [3335.7290084812175, 3327.202331393974, 3335.7290084812175],
-        # [3335.7290084812175, 3327.202331393974, 3335.7290084812175],
         # ),
     ],
 )
-def test_surrogate(backend, expected_means, expected_stddevs, expected_raw_stddevs):
+def test_surrogate(backend, expected_means, expected_stddevs):
     data = prediction_1D(backend)
     model = core.train_model(data)
-    means, stddevs, raw_stddevs, _ = core.get_surrogate_values(data, model)
+    means, stddevs, _ = core.get_surrogate_values(data, model)
     assert means == pytest.approx(expected_means)
     assert stddevs[1:4] == pytest.approx(expected_stddevs)
-    assert raw_stddevs[1:4] == pytest.approx(expected_raw_stddevs)
 
 
 @pytest.mark.parametrize(
     ('backend'),
     [
         ('sklearn'),
-        # ('gpax'),
     ],
 )
 def test_inverse_transform(backend):
     data = prediction_1D(backend)
-    assert data.inverse_transform(np.array([-1, 0, 1])) == pytest.approx([-1, 0, 1])
-    assert data.inverse_transform(np.array([-1, 0, 1]), True) == pytest.approx([-1, 0, 1])
+
+    test_y = np.array([-1, 0, 1])
+    test_yerr = np.array([0.1, 1, 10])
+
+    def test_transform(inv_y, inv_yerr):
+        y, yerr = data.transform_Y(inv_y, inv_yerr)
+        assert y == pytest.approx(test_y)
+        assert yerr == pytest.approx(test_yerr)
+
+    inv_y, inv_yerr = data.inverse_transform_Y(test_y, test_yerr)
+    assert inv_y == pytest.approx(test_y)
+    assert inv_yerr == pytest.approx(test_yerr)
+    test_transform(inv_y, inv_yerr)
 
     data.preprocess_log = True
-    assert data.inverse_transform(np.array([-1, 0, 1])) == pytest.approx(
-        [1 / E_CONSTANT, 1, E_CONSTANT]
-    )
-    assert data.inverse_transform(np.array([-1, 0, 1]), True) == pytest.approx([-1, -1, -1])
+    inv_y, inv_yerr = data.inverse_transform_Y(test_y, test_yerr)
+    assert inv_y == pytest.approx([1 / E_CONSTANT, 1, E_CONSTANT])
+    assert inv_yerr == pytest.approx(inv_y * test_yerr)
+    test_transform(inv_y, inv_yerr)
 
     data.preprocess_log = False
     data.preprocess_standardize = True
-    assert data.inverse_transform(np.array([-1, 0, 1])) == pytest.approx([100, 150, 200])
-    assert data.inverse_transform(np.array([-1, 0, 1]), True) == pytest.approx(
-        [-50, 0, 50]
-    )  # technically improper, as uncertainties can't be negative
+    inv_y, inv_yerr = data.inverse_transform_Y(test_y, test_yerr)
+    assert inv_y == pytest.approx([100, 150, 200])
+    assert inv_yerr == pytest.approx(50 * test_yerr)
+    test_transform(inv_y, inv_yerr)
 
     data.preprocess_log = True
-    assert data.inverse_transform(np.array([-1, 0, 1])) == pytest.approx(
-        [100, 141.42135623730945, 200]
-    )  # TODO
-    assert data.inverse_transform(np.array([-1, 0, 1]), True) == pytest.approx([-1, -1, -1])
+    inv_y, inv_yerr = data.inverse_transform_Y(test_y, test_yerr)
+    assert inv_y == pytest.approx([100, 141.42135623730945, 200])
+    assert inv_yerr == pytest.approx(inv_y * 0.34657359027997243 * test_yerr)
+    test_transform(inv_y, inv_yerr)
diff --git a/uv.lock b/uv.lock
index bc5466a..0e595b0 100644
--- a/uv.lock
+++ b/uv.lock
@@ -697,7 +697,7 @@ dev = [
 requires-dist = [
     { name = "furo", marker = "extra == 'docs'", specifier = ">=2023.3.27" },
     { name = "gpax", specifier = ">=0.1.8" },
-    { name = "intersect-sdk", specifier = ">=0.9.0,<0.10.0" },
+    { name = "intersect-sdk", specifier = ">=0.9.3,<0.10.0" },
     { name = "numpy" },
     { name = "numpyro", specifier = "<0.20.1" },
     { name = "pymongo", specifier = ">=4.12.1" },
@@ -1102,20 +1102,32 @@ wheels = [
 
 [[package]]
 name = "intersect-sdk"
-version = "0.9.0"
+version = "0.9.3"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
+    { name = "intersect-sdk-common" },
     { name = "jsonschema", extra = ["format-nongpl"] },
+    { name = "psutil" },
+    { name = "pydantic" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/ad/4a/4197405ffa4d42913d3358cf34d1b0ec15a841c994c5931b3785a975a86a/intersect_sdk-0.9.3.tar.gz", hash = "sha256:b0f563ae161f7851c1281fd4023222ce6509af33fae371f776470d1767dcfb7c", size = 54468, upload-time = "2026-06-23T16:02:18.534Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/f0/53/a2fb84ca204d3b794c6c9e93487d38169a075b9422ca27d5b95a794528c2/intersect_sdk-0.9.3-py3-none-any.whl", hash = "sha256:d02b87b07134de96e060054750cd82445334a573f5df34a451d4d786118c904b", size = 66750, upload-time = "2026-06-23T16:02:17.437Z" },
+]
+
+[[package]]
+name = "intersect-sdk-common"
+version = "0.9.6"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
     { name = "minio" },
     { name = "paho-mqtt" },
     { name = "pika" },
-    { name = "psutil" },
     { name = "pydantic" },
-    { name = "retrying" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/26/4e/8671bcef8b222626aad9a615328c8b8823d577919d26f78b095018c0d715/intersect_sdk-0.9.0.tar.gz", hash = "sha256:76413ea6307e58b1e664a391e10cc2e31bcb899c4fee4e5e6f8c640fcebbd244", size = 108556, upload-time = "2026-02-11T19:32:24.078Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/d7/65/83884f05d52241d0fe3362baaca4b08bfd447b9360daeb52dcfa9bfa8b63/intersect_sdk_common-0.9.6.tar.gz", hash = "sha256:b46e2a155f9f73c2fa621c0a1c212f97dd90f53f856e61d30faa5dc7986f7ecd", size = 32223, upload-time = "2026-06-02T21:23:19.529Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/dd/b7/4ce6222b6bffcae9413115298caea7b37c5b3b97f68746a27b4bc06ef9ff/intersect_sdk-0.9.0-py3-none-any.whl", hash = "sha256:6aa3c05d053c54b0f7c314bc8c618952a1c5c5d91427cd86e6c5c4851a2a60f3", size = 100771, upload-time = "2026-02-11T19:32:22.506Z" },
+    { url = "https://files.pythonhosted.org/packages/0a/2a/3085cce8374b733c0255cc1d35889d42d1452bf33e681a996754bec77ebb/intersect_sdk_common-0.9.6-py3-none-any.whl", hash = "sha256:8947769d54eab04c4da3adbb403f0c224c07faf76a45f98e372ae112130adaf8", size = 45082, upload-time = "2026-06-02T21:23:20.407Z" },
 ]
 
 [[package]]
@@ -2992,15 +3004,6 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/a0/f4/c67b0b3f1b9245e8d266f0f112c500d50e5b4e83cb6f3b71b6528104182a/requests-2.34.2-py3-none-any.whl", hash = "sha256:2a0d60c172f83ac6ab31e4554906c0f3b3588d37b5cb939b1c061f4907e278e0", size = 73075, upload-time = "2026-05-14T19:25:26.443Z" },
 ]
 
-[[package]]
-name = "retrying"
-version = "1.4.2"
-source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/c8/5a/b17e1e257d3e6f2e7758930e1256832c9ddd576f8631781e6a072914befa/retrying-1.4.2.tar.gz", hash = "sha256:d102e75d53d8d30b88562d45361d6c6c934da06fab31bd81c0420acb97a8ba39", size = 11411, upload-time = "2025-08-03T03:35:25.189Z" }
-wheels = [
-    { url = "https://files.pythonhosted.org/packages/67/f3/6cd296376653270ac1b423bb30bd70942d9916b6978c6f40472d6ac038e7/retrying-1.4.2-py3-none-any.whl", hash = "sha256:bbc004aeb542a74f3569aeddf42a2516efefcdaff90df0eb38fbfbf19f179f59", size = 10859, upload-time = "2025-08-03T03:35:23.829Z" },
-]
-
 [[package]]
 name = "rfc3339-validator"
 version = "0.1.4"