From 412451987f2f1e80fa7cbed08406a1b1ab9bad8f Mon Sep 17 00:00:00 2001
From: Sam-XiaoyueLi <xiaoyue.li.samantha@gmail.com>
Date: Wed, 28 Feb 2024 17:15:09 +0800
Subject: [PATCH] Added documentation + test of effect of n_taylor

---
 .../dbi/dbi_strategy_magnetic_field.ipynb     | 83 +++++++++++++++++++
 src/qibo/models/dbi/double_bracket.py         |  3 +
 src/qibo/models/dbi/utils.py                  | 56 +++++++++++--
 3 files changed, 133 insertions(+), 9 deletions(-)

diff --git a/examples/dbi/dbi_strategy_magnetic_field.ipynb b/examples/dbi/dbi_strategy_magnetic_field.ipynb
index 40e46f422a..8ab8207500 100644
--- a/examples/dbi/dbi_strategy_magnetic_field.ipynb
+++ b/examples/dbi/dbi_strategy_magnetic_field.ipynb
@@ -300,6 +300,89 @@
     "plt.ylabel(r'$|| \\sigma(e^{sW}He^{-sW}) || $')\n",
     "plt.legend()"
    ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Effect of `n_taylor`"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# backend\n",
+    "set_backend(\"qibojit\", \"numba\")\n",
+    "# initialize dbi object\n",
+    "nqubits = 5\n",
+    "h0 = random_hermitian(2**nqubits, seed=2)\n",
+    "scheduling = DoubleBracketScheduling.hyperopt\n",
+    "mode = DoubleBracketGeneratorType.single_commutator\n",
+    "n_1 = 5\n",
+    "n_2 = 2\n",
+    "dbi_1 = DoubleBracketIteration(Hamiltonian(nqubits=nqubits, matrix=h0), scheduling=scheduling, mode=mode)\n",
+    "dbi_2 = DoubleBracketIteration(Hamiltonian(nqubits=nqubits, matrix=h0), scheduling=scheduling, mode=mode)\n",
+    "print(\"Initial off diagonal norm\", dbi_1.off_diagonal_norm)\n",
+    "visualize_matrix(dbi_1.h.matrix, title=f'Random hamiltonian with L={nqubits}')"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# generate the onsite Z operators\n",
+    "onsite_Z_ops = generate_onsite_Z_ops(nqubits)\n",
+    "d_coef = onsite_Z_decomposition(dbi.h.matrix, onsite_Z_ops)\n",
+    "d = sum([d_coef[i] * onsite_Z_ops[i] for i in range(nqubits)])\n",
+    "grad, s = gradient_onsite_Z(dbi,d,5, onsite_Z_ops)\n",
+    "print('The initial D coefficients:', d_coef)\n",
+    "print('Gradient:', grad)\n",
+    "print('s:', s)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "iters = 30\n",
+    "d_coef_1, d_1 = d_coef, d\n",
+    "d_coef_2, d_2 = d_coef, d\n",
+    "\n",
+    "off_diagonal_norm_1 = [dbi_1.off_diagonal_norm]\n",
+    "off_diagonal_norm_2 = [dbi_2.off_diagonal_norm]\n",
+    "s_step_1 = [0]\n",
+    "s_step_2 = [0]\n",
+    "for i in range(iters):\n",
+    "    s_1, d_coef_1, d_1 = gradient_descent_onsite_Z(dbi_1, d_coef_1, d_1, onsite_Z_ops=onsite_Z_ops, n_taylor=n_1, max_evals=100)\n",
+    "    s_2, d_coef_2, d_2 = gradient_descent_onsite_Z(dbi_2, d_coef_2, d_2, onsite_Z_ops=onsite_Z_ops, n_taylor=n_2, max_evals=100)\n",
+    "    dbi_1(step=s_1, d=d_1)\n",
+    "    dbi_2(step=s_2, d=d_2)\n",
+    "    off_diagonal_norm_1.append(dbi_1.off_diagonal_norm)\n",
+    "    off_diagonal_norm_2.append(dbi_2.off_diagonal_norm)\n",
+    "    s_step_1.append(s_1)\n",
+    "    s_step_2.append(s_2)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "plt.title(str(nqubits) + ' spins magnetic field diagonalization')\n",
+    "plt.plot(off_diagonal_norm_1, label=f'n_taylor={n_1}')\n",
+    "plt.plot(off_diagonal_norm_2, label=f'n_taylor={n_2}')\n",
+    "plt.legend()\n",
+    "plt.xlabel('Iteration')\n",
+    "plt.ylabel(r'$|| \\sigma(e^{sW}He^{-sW}) || $')"
+   ]
   }
  ],
  "metadata": {
diff --git a/src/qibo/models/dbi/double_bracket.py b/src/qibo/models/dbi/double_bracket.py
index e75fa16a21..46b8112712 100644
--- a/src/qibo/models/dbi/double_bracket.py
+++ b/src/qibo/models/dbi/double_bracket.py
@@ -280,6 +280,9 @@ def choose_step(
         scheduling: Optional[DoubleBracketScheduling] = None,
         **kwargs,
     ):
+        """
+        Calculate the optimal step using respective `scheduling` methods.
+        """
         if scheduling is None:
             scheduling = self.scheduling
         if scheduling is DoubleBracketScheduling.grid_search:
diff --git a/src/qibo/models/dbi/utils.py b/src/qibo/models/dbi/utils.py
index 3ac26d0225..d179d45a4d 100644
--- a/src/qibo/models/dbi/utils.py
+++ b/src/qibo/models/dbi/utils.py
@@ -187,10 +187,19 @@ def ds_di_onsite_Z(
     dbi_object: DoubleBracketIteration,
     d: np.array,
     i: int,
-    taylor_coef=None,
-    onsite_Z_ops=None,
+    taylor_coef: Optional[list] = None,
+    onsite_Z_ops: Optional[list] = None,
 ):
-    """Return the derivatives of the first 3 polynomial coefficients with respect to onsite Pauli-Z coefficients"""
+    r"""Return the derivatives of the first 3 polynomial coefficients with respect to onsite Pauli-Z coefficients\
+        Args:
+            dbi_object (DoubleBracketIteration): the target dbi object
+            d (np.array): the diagonal operator
+            i (int): the index of onsite-Z coefficient
+            taylor_coef (list): coefficients of `s` in the taylor expansion of math:`\\frac{\\partial ||\sigma(e^{sW}He^{-sW})||^2}{\\partial s}`, from the highest order to the lowest.
+            onsite_Z_ops (list): onsite Z operators of `dbi_object.h`
+        Returns:
+            floats da, db, dc, ds
+    """
     # generate the list of derivatives w.r.t ith Z operator coefficient
     nqubits = int(np.log2(d.shape[0]))
     if onsite_Z_ops is None:
@@ -227,11 +236,18 @@ def derivative_product(k1, k2):
 def gradient_onsite_Z(
     dbi_object: DoubleBracketIteration,
     d: np.array,
-    n_taylor=3,
+    n_taylor=2,
     onsite_Z_ops=None,
     use_ds=False,
 ):
-    """Calculate the gradient of loss function with respect to onsite Pauli-Z coefficients"""
+    r"""Calculate the gradient of loss function with respect to onsite Pauli-Z coefficients
+    Args:
+        dbi_object (DoubleBracketIteration): the target dbi object
+        d (np.array): the diagonal operator
+        n_taylor (int): the highest order of the taylore expansion of  w.r.t `s`
+        taylor_coef (list): coefficients of `s` in the taylor expansion of math:`\\frac{\\partial ||\sigma(e^{sW}He^{-sW})||^2}{\\partial s}`
+        use_ds (boolean): if False, ds is set to 0
+    """
     # n is the highest order for calculating s
 
     # initialize gradient
@@ -244,6 +260,7 @@ def gradient_onsite_Z(
         n=n_taylor,
         backup_scheduling=DoubleBracketScheduling.polynomial_approximation,
     )
+
     a, b, c = coef[len(coef) - 3 :]
     for i in range(nqubits):
         da, db, dc, ds = ds_di_onsite_Z(dbi_object, d, i, [a, b, c], onsite_Z_ops)
@@ -263,6 +280,7 @@ def gradient_onsite_Z(
 
 
 def onsite_Z_decomposition(h_matrix: np.array, onsite_Z_ops=None):
+    """finds the decomposition of hamiltonian `h_matrix` into Pauli-Z operators"""
     nqubits = int(np.log2(h_matrix.shape[0]))
     if onsite_Z_ops is None:
         onsite_Z_ops = generate_onsite_Z_ops(nqubits)
@@ -274,6 +292,7 @@ def onsite_Z_decomposition(h_matrix: np.array, onsite_Z_ops=None):
 
 
 def generate_onsite_Z_ops(nqubits):
+    """generate the list of Pauli-Z operators of an `nqubit` system in the form of np.array"""
     onsite_Z_str = ["I" * (i) + "Z" + "I" * (nqubits - i - 1) for i in range(nqubits)]
     onsite_Z_ops = [
         SymbolicHamiltonian(str_to_symbolic(Z_i_str)).dense.matrix
@@ -285,18 +304,37 @@ def generate_onsite_Z_ops(nqubits):
 def gradient_descent_onsite_Z(
     dbi_object: DoubleBracketIteration,
     d_coef: list,
-    d: np.array = None,
-    n_taylor: int = 3,
-    onsite_Z_ops=None,
+    d: Optional[np.array] = None,
+    n_taylor: int = 2,
+    onsite_Z_ops: Optional[list] = None,
     lr_min: float = 1e-5,
     lr_max: float = 1,
     max_evals: int = 100,
     space: callable = None,
     optimizer: callable = None,
-    look_ahead: int = 1,
     verbose: bool = False,
     use_ds: bool = True,
 ):
+    """calculate the elements of one gradient descent step on `dbi_object`.
+
+    Args:
+        dbi_object (DoubleBracketIteration): the target dbi object
+        d_coef (list): the initial decomposition of `d` into Pauli-Z operators
+        d (np.array, optional): the initial diagonal operator. Defaults to None.
+        n_taylor (int, optional): the highest order to expand the loss function derivative. Defaults to 2.
+        onsite_Z_ops (list, optional): list of onsite-Z operators. Defaults to None.
+        lr_min (float, optional): the minimal gradient step. Defaults to 1e-5.
+        lr_max (float, optional): the maximal gradient step. Defaults to 1.
+        max_evals (int, optional): the max number of evaluations for `hyperopt` to find the optimal gradient step `lr`. Defaults to 100.
+        space (callable, optional): the search space for `hyperopt`. Defaults to None.
+        optimizer (callable, optional): optimizer for `hyperopt`. Defaults to None.
+        verbose (bool, optional): option to print out the 'hyperopt' progress. Defaults to False.
+        use_ds (bool, optional): if False, ds is set to 0. Defaults to True.
+
+    Returns:
+        the optimal step found, coeffcients of `d` in Pauli-Z basis, matrix of `d`
+
+    """
     nqubits = int(np.log2(dbi_object.h.matrix.shape[0]))
     if onsite_Z_ops is None:
         onsite_Z_ops = generate_onsite_Z_ops(nqubits)