use new RDP also in simulations

gschramm · gschramm · commit 63d050e3576d · 2024-08-28T16:57:43.000+02:00
diff --git a/simulations/stochastic_grad.py b/simulations/stochastic_grad.py
@@ -18,15 +18,18 @@
 
 from utils import (
     SubsetNegPoissonLogLWithPrior,
-    RDP,
     split_fwd_model,
     OSEM,
     SGD,
     SVRG,
     rdp_preconditioner,
-    neighbor_product,
 )
 
+import sys
+
+sys.path.append("../")
+from rdp import RDP, neighbor_product
+
 # choose a device (CPU or CUDA GPU)
 if "numpy" in xp.__name__:
     # using numpy, device must be cpu
@@ -71,9 +74,9 @@
 svrg_gradient_recalc_periods = [x for x in range(0, num_epochs_sgd, 2)]
 # (initial) step sizes to try
 step_sizes = [
-    0.5,
+    0.3,
     1.0,
-    2.0,
+    3.0,
 ]  # step size 0 means that quick and dirty line search is used
 
 # max number of updates for reference L-BFGS-B solution
@@ -289,14 +292,32 @@
 prior = RDP(
     img_shape,
     xp=xp,
-    eps=float(xp.max(x_osem)) / 100,
     dev=dev,
+    voxel_size=xp.asarray(voxel_size, device=dev),
+    eps=float(xp.max(x_osem)) / 100,
     gamma=gamma_rdp,
 )
 
-prior.weights = neighbor_product(kappa_img, xp)
+prior.kappa = kappa_img
 prior.scale = beta
 
+adjoint_ones = pet_lin_op.adjoint(
+    xp.ones(pet_lin_op.out_shape, device=dev, dtype=xp.float32)
+)
+
+## %%
+# x = x_init.copy()
+# h = prior.diag_hessian(x)
+# d_data = to_device(adjoint_ones, "cpu")
+# d_prior = to_device(h * x, "cpu")
+#
+## %%
+# import pymirc.viewer as pv
+# vi = pv.ThreeAxisViewer([d_data, d_prior, d_data > d_prior])
+
+# %%
+
+
 pet_subset_lin_op_seq, subset_slices = split_fwd_model(pet_lin_op, num_subsets_sgd)
 
 cost_function = SubsetNegPoissonLogLWithPrior(
@@ -335,9 +356,6 @@
 
 x_osem_scale = float(xp.mean(x_init))
 
-adjoint_ones = pet_lin_op.adjoint(
-    xp.ones(pet_lin_op.out_shape, device=dev, dtype=xp.float32)
-)
 
 # %%
 cost_osem = cost_function(x_osem)
diff --git a/simulations/utils.py b/simulations/utils.py
@@ -305,147 +305,147 @@ def _approx_diag_hessian(self, x: Array) -> Array:
         return diag_hes
 
 
-def neighbor_difference_and_sum(
-    x: Array, xp: ModuleType, padding: str = "edge"
-) -> tuple[Array, Array]:
-    """get differences and sums with nearest neighbors for an n-dimensional array x
-    using padding (by default in edge mode)
-    a x.ndim*(3,) neighborhood around each element is used
-    """
-    x_padded = xp.pad(x, 1, mode=padding)
-
-    # number of nearest neighbors
-    num_neigh = 3**x.ndim - 1
-
-    # array for differences and sums with nearest neighbors
-    d = xp.zeros((num_neigh,) + x.shape, dtype=x.dtype)
-    s = xp.zeros((num_neigh,) + x.shape, dtype=x.dtype)
-
-    for i, ind in enumerate(xp.ndindex(x.ndim * (3,))):
-        if i != (num_neigh // 2):
-            sl = []
-            for j in ind:
-                if j - 2 < 0:
-                    sl.append(slice(j, j - 2))
-                else:
-                    sl.append(slice(j, None))
-            sl = tuple(sl)
-
-            if i < num_neigh // 2:
-                d[i] = x - x_padded[sl]
-                s[i] = x + x_padded[sl]
-            else:
-                d[i - 1] = x - x_padded[sl]
-                s[i - 1] = x + x_padded[sl]
-
-    return d, s
-
-
-def neighbor_product(x: Array, xp: ModuleType, padding: str = "edge") -> Array:
-    """get backward and forward neighbor products for each dimension of an array x
-    using padding (by default in edge mode)
-    """
-    x_padded = xp.pad(x, 1, mode=padding)
-
-    # number of nearest neighbors
-    num_neigh = 3**x.ndim - 1
-
-    # array for differences and sums with nearest neighbors
-    p = xp.zeros((num_neigh,) + x.shape, dtype=x.dtype)
-
-    for i, ind in enumerate(xp.ndindex(x.ndim * (3,))):
-        if i != (num_neigh // 2):
-            sl = []
-            for j in ind:
-                if j - 2 < 0:
-                    sl.append(slice(j, j - 2))
-                else:
-                    sl.append(slice(j, None))
-            sl = tuple(sl)
-
-            if i < num_neigh // 2:
-                p[i] = x * x_padded[sl]
-            else:
-                p[i - 1] = x * x_padded[sl]
-
-    return p
-
-
-class RDP(SmoothFunctionWithApproxHessian):
-    def __init__(
-        self,
-        in_shape: tuple[int, ...],
-        xp: ModuleType,
-        dev: str,
-        eps: float | None = None,
-        gamma: float = 2.0,
-        padding: str = "edge",
-    ) -> None:
-        self._gamma = gamma
-
-        if eps is None:
-            self._eps = xp.finfo(xp.float32).eps
-        else:
-            self._eps = eps
-
-        self._padding = padding
-
-        self._weights = None
-
-        super().__init__(in_shape=in_shape, xp=xp, dev=dev)
-
-    @property
-    def gamma(self) -> float:
-        return self._gamma
-
-    @property
-    def eps(self) -> float:
-        return self._eps
-
-    @property
-    def weights(self) -> Array | None:
-        return self._weights
-
-    @weights.setter
-    def weights(self, weights: Array) -> None:
-        self._weights = weights
-
-    def _call(self, x: Array) -> float:
-
-        if float(self.xp.min(x)) < 0:
-            return self.xp.inf
-
-        d, s = neighbor_difference_and_sum(x, self.xp, padding=self._padding)
-        phi = s + self.gamma * self.xp.abs(d) + self.eps
-
-        tmp = (d**2) / phi
-
-        if self._weights is not None:
-            tmp *= self._weights
-
-        return float(self.xp.sum(tmp))
-
-    def _gradient(self, x: Array) -> Array:
-        d, s = neighbor_difference_and_sum(x, self.xp, padding=self._padding)
-        phi = s + self.gamma * self.xp.abs(d) + self.eps
-
-        tmp = d * (2 * phi - (d + self.gamma * self.xp.abs(d))) / (phi**2)
-
-        if self._weights is not None:
-            tmp *= self._weights
-
-        return 2 * tmp.sum(axis=0)
-
-    def _approx_diag_hessian(self, x: Array) -> Array:
-        d, s = neighbor_difference_and_sum(x, self.xp, padding=self._padding)
-        phi = s + self.gamma * self.xp.abs(d) + self.eps
-
-        tmp = ((s - d + self.eps) ** 2) / (phi**3)
-
-        if self._weights is not None:
-            tmp *= self._weights
-
-        return 4 * tmp.sum(axis=0)
+# def neighbor_difference_and_sum(
+#    x: Array, xp: ModuleType, padding: str = "edge"
+# ) -> tuple[Array, Array]:
+#    """get differences and sums with nearest neighbors for an n-dimensional array x
+#    using padding (by default in edge mode)
+#    a x.ndim*(3,) neighborhood around each element is used
+#    """
+#    x_padded = xp.pad(x, 1, mode=padding)
+#
+#    # number of nearest neighbors
+#    num_neigh = 3**x.ndim - 1
+#
+#    # array for differences and sums with nearest neighbors
+#    d = xp.zeros((num_neigh,) + x.shape, dtype=x.dtype)
+#    s = xp.zeros((num_neigh,) + x.shape, dtype=x.dtype)
+#
+#    for i, ind in enumerate(xp.ndindex(x.ndim * (3,))):
+#        if i != (num_neigh // 2):
+#            sl = []
+#            for j in ind:
+#                if j - 2 < 0:
+#                    sl.append(slice(j, j - 2))
+#                else:
+#                    sl.append(slice(j, None))
+#            sl = tuple(sl)
+#
+#            if i < num_neigh // 2:
+#                d[i] = x - x_padded[sl]
+#                s[i] = x + x_padded[sl]
+#            else:
+#                d[i - 1] = x - x_padded[sl]
+#                s[i - 1] = x + x_padded[sl]
+#
+#    return d, s
+#
+#
+# def neighbor_product(x: Array, xp: ModuleType, padding: str = "edge") -> Array:
+#    """get backward and forward neighbor products for each dimension of an array x
+#    using padding (by default in edge mode)
+#    """
+#    x_padded = xp.pad(x, 1, mode=padding)
+#
+#    # number of nearest neighbors
+#    num_neigh = 3**x.ndim - 1
+#
+#    # array for differences and sums with nearest neighbors
+#    p = xp.zeros((num_neigh,) + x.shape, dtype=x.dtype)
+#
+#    for i, ind in enumerate(xp.ndindex(x.ndim * (3,))):
+#        if i != (num_neigh // 2):
+#            sl = []
+#            for j in ind:
+#                if j - 2 < 0:
+#                    sl.append(slice(j, j - 2))
+#                else:
+#                    sl.append(slice(j, None))
+#            sl = tuple(sl)
+#
+#            if i < num_neigh // 2:
+#                p[i] = x * x_padded[sl]
+#            else:
+#                p[i - 1] = x * x_padded[sl]
+#
+#    return p
+#
+#
+# class RDP(SmoothFunctionWithApproxHessian):
+#    def __init__(
+#        self,
+#        in_shape: tuple[int, ...],
+#        xp: ModuleType,
+#        dev: str,
+#        eps: float | None = None,
+#        gamma: float = 2.0,
+#        padding: str = "edge",
+#    ) -> None:
+#        self._gamma = gamma
+#
+#        if eps is None:
+#            self._eps = xp.finfo(xp.float32).eps
+#        else:
+#            self._eps = eps
+#
+#        self._padding = padding
+#
+#        self._weights = None
+#
+#        super().__init__(in_shape=in_shape, xp=xp, dev=dev)
+#
+#    @property
+#    def gamma(self) -> float:
+#        return self._gamma
+#
+#    @property
+#    def eps(self) -> float:
+#        return self._eps
+#
+#    @property
+#    def weights(self) -> Array | None:
+#        return self._weights
+#
+#    @weights.setter
+#    def weights(self, weights: Array) -> None:
+#        self._weights = weights
+#
+#    def _call(self, x: Array) -> float:
+#
+#        if float(self.xp.min(x)) < 0:
+#            return self.xp.inf
+#
+#        d, s = neighbor_difference_and_sum(x, self.xp, padding=self._padding)
+#        phi = s + self.gamma * self.xp.abs(d) + self.eps
+#
+#        tmp = (d**2) / phi
+#
+#        if self._weights is not None:
+#            tmp *= self._weights
+#
+#        return float(self.xp.sum(tmp))
+#
+#    def _gradient(self, x: Array) -> Array:
+#        d, s = neighbor_difference_and_sum(x, self.xp, padding=self._padding)
+#        phi = s + self.gamma * self.xp.abs(d) + self.eps
+#
+#        tmp = d * (2 * phi - (d + self.gamma * self.xp.abs(d))) / (phi**2)
+#
+#        if self._weights is not None:
+#            tmp *= self._weights
+#
+#        return 2 * tmp.sum(axis=0)
+#
+#    def _approx_diag_hessian(self, x: Array) -> Array:
+#        d, s = neighbor_difference_and_sum(x, self.xp, padding=self._padding)
+#        phi = s + self.gamma * self.xp.abs(d) + self.eps
+#
+#        tmp = ((s - d + self.eps) ** 2) / (phi**3)
+#
+#        if self._weights is not None:
+#            tmp *= self._weights
+#
+#        return 4 * tmp.sum(axis=0)
 
 
 class L2DataFidelity(SmoothFunction):
@@ -1129,14 +1129,14 @@ def split_fwd_model(
 def rdp_preconditioner(
     x: Array,
     adjoint_ones: Array,
-    prior: SmoothFunctionWithApproxHessian,
+    prior,
     version: int = 1,
     delta: float = 1e-6,
 ) -> Array:
     if version == 1:
         precond = (x + delta) / adjoint_ones
     elif version == 2:
-        precond = (x + delta) / (adjoint_ones + prior.approx_diag_hessian(x) * x)
+        precond = (x + delta) / (adjoint_ones + prior.diag_hessian(x) * x)
     else:
         raise ValueError("precond_version must be 1 or 2")