Source code for krotov.functionals

r"""Functionals and `chi_constructor` routines.

Any `chi_constructor` routine passed to :func:`.optimize_pulses` must take the
following keyword-arguments:

    * `fw_states_T` (:class:`list` of :class:`~qutip.Qobj`): The list of
      states resulting from the forward-propagation of each
      :attr:`.Objective.initial_state` under the guess pulses of the current
      iteration (the optimized pulses of the previous iteration)

    * `objectives` (:class:`list` of :class:`.Objective`): A list of the
      optimization objectives.

    * `tau_vals` (:class:`list` of :class:`complex` or :obj:`None`): The
      overlaps of the :attr:`.Objective.target` and the corresponding
      `fw_states_T`, assuming :attr:`.Objective.target` contains a
      quantum state. If the objective defines no target state, a list of Nones

Krotov's method does not have an explicit dependence on the optimization
functional. It only enters through the `chi_constructor` which calculates the
boundary condition for the backward propagation, that is, the states


.. math::

   \Ket{\chi_k^{(i)}(T)}
      = - \left.\frac{\partial J_T}
        {\partial \Bra{\phi_k}}
        \right\vert_{\phi^{(i)}(T)}

for functionals defined in Hilbert space, or

.. math::

   \Op{\chi}_k^{(i)}(T)
      = - \left.\frac{\partial J_T}
        {\partial \langle\!\langle\Op{\rho}_k\vert}
        \right\vert_{\rho^{(i)}(T)}

in Liouville space, using the abstract
Hilbert-Schmidt notation :math:`\langle\!\langle a \vert b \rangle\!\rangle
\equiv \tr[a^\dagger b]`.
Passing a specific `chi_constructor` results in the minimization of the final
time functional from which that `chi_constructor` was derived.

The functions in this module that evaluate functionals are intended for use
inside a function that is passed as an `info_hook` to :func:`.optimize_pulses`.
Thus, they calculate $J_T$ from the same keyword arguments as the `info_hook`.
The values for $J_T$ may be used in a convergence analysis, see
:mod:`krotov.convergence`.
"""
import logging

import numpy as np
import qutip

from .second_order import _overlap


__all__ = [
    'f_tau',
    'F_ss',
    'J_T_ss',
    'chis_ss',
    'F_sm',
    'J_T_sm',
    'chis_sm',
    'F_re',
    'J_T_re',
    'chis_re',
    'J_T_hs',
    'chis_hs',
    'F_avg',
    'gate',
    'mapped_basis',
]


[docs]def f_tau(fw_states_T, objectives, tau_vals=None, **kwargs): r"""Average complex overlaps of the target states with the `fw_states_T`. That is, .. math:: f_{\tau} = \frac{1}{N} \sum_{k=1}^{N} w_k \tau_k where $\tau_k$ are the elements of `tau_vals`, assumed to be .. math:: \tau_k = \Braket{\Psi_k^{\tgt}}{\Psi_k(T)}, in Hilbert space, or .. math:: \tau_k = \tr\left[\Op{\rho}_k^{\tgt\,\dagger}\Op{\rho}_k(T)\right] in Liouville space, where $\ket{\Psi_k}$ or $\Op{\rho}_k$ are the elements of `fw_states_T`, and $\ket{\Psi_k^{\tgt}}$ or $\Op{\rho}^{\tgt}$ are the target states from the :attr:`~.Objective.target` attribute of the objectives. If `tau_vals` are None, they will be calculated internally. $N$ is the number of objectives, and $w_k$ is an optional weight for each objective. For any objective that has a (custom) `weight` attribute, the $w_k$ is taken from that attribute; otherwise, $w_k = 1$. The weights, if present, are not automatically normalized, they are assumed to have values such that the resulting $f_{\tau}$ lies in the unit circle of the complex plane. Usually, this means that the weights should sum to $N$. The exception would be for mixed target states, where the weights should compensate for the non-unit purity. The problem may be circumvented by using :func:`J_T_hs` for mixed target states. The `kwargs` are ignored, allowing the function to be used in an `info_hook`. """ if tau_vals is None: tau_vals = [ _overlap(obj.target, psi) for (psi, obj) in zip(fw_states_T, objectives) ] res = 0j for (obj, τ) in zip(objectives, tau_vals): if τ is None: logger = logging.getLogger('krotov') logger.warning("τ is None in f_tau") continue if hasattr(obj, 'weight'): res += obj.weight * τ else: res += τ return res / len(objectives)
[docs]def F_ss(fw_states_T, objectives, tau_vals=None, **kwargs): r"""State-to-state phase-insensitive fidelity .. math:: F_{\text{ss}} = \frac{1}{N} \sum_{k=1}^{N} w_k \Abs{\tau_k}^2 \quad\in [0, 1] with $N$, $w_k$ and $\tau_k$ as in :func:`f_tau`. The `kwargs` are ignored, allowing the function to be used in an `info_hook`. """ if tau_vals is None: # get the absolute square, analogously to the f_tau function above tau_vals_abssq = [ abs(_overlap(obj.target, psi)) ** 2 for (psi, obj) in zip(fw_states_T, objectives) ] else: tau_vals_abssq = [abs(tau) ** 2 for tau in tau_vals] F = f_tau(fw_states_T, objectives, tau_vals_abssq) assert abs(F.imag) < 1e-10, F.imag return F.real
[docs]def J_T_ss(fw_states_T, objectives, tau_vals=None, **kwargs): r"""State-to-state phase-insensitive functional $J_{T,\text{ss}}$ .. math:: J_{T,\text{ss}} = 1 - F_{\text{ss}} \quad\in [0, 1]. All arguments are passed to :func:`F_ss`. """ return 1 - F_ss(fw_states_T, objectives, tau_vals)
[docs]def chis_ss(fw_states_T, objectives, tau_vals): r"""States $\ket{\chi_k}$ for functional $J_{T,\text{ss}}$ .. math:: \Ket{\chi_k} = -\frac{\partial J_{T,\text{ss}}}{\partial \bra{\Psi_k(T)}} = \frac{1}{N} w_k \tau_k \Ket{\Psi^{\tgt}_k} with $\tau_k$ and $w_k$ as defined in :func:`f_tau`. """ N = len(objectives) res = [] for (obj, τ) in zip(objectives, tau_vals): # `obj.target` is assumed to be the "target state" (gate applied to # `initial_state`) if hasattr(obj, 'weight'): res.append((τ / N) * obj.weight * obj.target) else: res.append((τ / N) * obj.target) return res
[docs]def F_sm(fw_states_T, objectives, tau_vals=None, **kwargs): r"""Square-modulus fidelity .. math:: F_{\text{sm}} = \Abs{f_{\tau}}^2 \quad\in [0, 1]. All arguments are passed to :func:`f_tau` to evaluate $f_{\tau}$. """ return abs(f_tau(fw_states_T, objectives, tau_vals)) ** 2
[docs]def J_T_sm(fw_states_T, objectives, tau_vals=None, **kwargs): r"""Square-modulus functional $J_{T,\text{sm}}$ .. math:: J_{T,\text{sm}} = 1 - F_{\text{sm}} \quad\in [0, 1] All arguments are passed to :func:`f_tau` while evaluating $F_{\text{sm}}$ in :func:`F_sm`. """ return 1 - F_sm(fw_states_T, objectives, tau_vals)
[docs]def chis_sm(fw_states_T, objectives, tau_vals): r"""States $\ket{\chi_k}$ for functional $J_{T,\text{sm}}$ .. math:: \Ket{\chi_k} = -\frac{\partial J_{T,\text{sm}}}{\partial \bra{\Psi_k(T)}} = \frac{1}{N^2} w_k \sum_{j}^{N} w_j\tau_j\Ket{\Psi^{\tgt}_k} with optional weights $w_k$, cf. :func:`f_tau` (default: :math:`w_k=1`). If given, the weights should generally sum to $N$. """ sum_of_w_tau = 0 for (obj, τ) in zip(objectives, tau_vals): if hasattr(obj, 'weight'): sum_of_w_tau += obj.weight * τ else: sum_of_w_tau += τ c = 1.0 / (len(objectives)) ** 2 res = [] for obj in objectives: # `obj.target` is assumed to be the "target state" (gate applied to # `initial_state`) if hasattr(obj, 'weight'): res.append(c * obj.weight * obj.target * sum_of_w_tau) else: res.append(c * obj.target * sum_of_w_tau) return res
[docs]def F_re(fw_states_T, objectives, tau_vals=None, **kwargs): r"""Real-part fidelity .. math:: F_{\text{re}} = \Re[f_{\tau}] \quad\in \begin{cases} [-1, 1] & \text{in Hilbert space} \\ [0, 1] & \text{in Liouville space.} \end{cases} All arguments are passed to :func:`f_tau` to evaluate $f_{\tau}$. """ return f_tau(fw_states_T, objectives, tau_vals).real
[docs]def J_T_re(fw_states_T, objectives, tau_vals=None, **kwargs): r"""Real-part functional $J_{T,\text{re}}$ .. math:: J_{T,\text{re}} = 1 - F_{\text{re}} \quad\in \begin{cases} [0, 2] & \text{in Hilbert space} \\ [0, 1] & \text{in Liouville space.} \end{cases} All arguments are passed to :func:`f_tau` while evaluating $F_{\text{re}}$ in :func:`F_re`. Note: If the target states are mixed, $J_{T,\text{re}}$ may take negative values (for `fw_states_T` that are "in the right direction", but more pure than the target states). In this case, you may consider using :func:`J_T_hs`. """ return 1 - F_re(fw_states_T, objectives, tau_vals)
[docs]def chis_re(fw_states_T, objectives, tau_vals): r"""States $\ket{\chi_k}$ for functional $J_{T,\text{re}}$ .. math:: \Ket{\chi_k} = -\frac{\partial J_{T,\text{re}}}{\partial \bra{\Psi_k(T)}} = \frac{1}{2N} w_k \Ket{\Psi^{\tgt}_k} with optional weights $w_k$, cf. :func:`f_tau` (default: :math:`w_k=1`). If given, the weights should generally sum to $N$. Note: `tau_vals` are ignored, but are present to satisfy the requirments of the `chi_constructor` interface. """ c = 1.0 / (2 * len(objectives)) res = [] for obj in objectives: # `obj.target` is assumed to be the "target state" (gate applied to # `initial_state`) if hasattr(obj, 'weight'): res.append(c * obj.weight * obj.target) else: res.append(c * obj.target) return res
[docs]def J_T_hs(fw_states_T, objectives, tau_vals=None, **kwargs): r"""Hilbert-Schmidt distance measure functional $J_{T,\text{hs}}$ .. math:: J_{T,\text{hs}} = \frac{1}{2N} \sum_{k=1}^{N} w_k \Norm{\Op{\rho}_k(T) - \Op{\rho}_k^{\tgt}}_{\text{hs}}^2 \quad \in \begin{cases} [0, 2] & \text{in Hilbert space} \\ [0, 1] & \text{in Liouville space} \end{cases} in Liouville space (using the Hilbert-Schmidt norm), or equivalently with $\ket{\Psi_k(T)}$ and $\ket{\Psi_k^{tgt}}$ in Hilbert space. The functional is evaluated as .. math:: J_{T,\text{hs}} = \frac{1}{2N} \sum_{k=1}^{N} w_k \left( \Norm{\Op{\rho}_k(T)}_{\text{hs}}^2 + \Norm{\Op{\rho}^{\tgt}}_{\text{hs}}^2 - 2 \Re[\tau_k] \right) where the $\Op{\rho}_k$ are the elements of `fw_states_T`, the $\Op{\rho}_k^{\tgt}$ are the target states from the :attr:`~.Objective.target` attribute of the objectives, and the $\tau_k$ are the elements of `tau_vals` (which will be calculated internally if passed as None). The $w_k$ are optional weights, cf. :func:`f_tau`. If given, the weights should generally sum to $N$. The `kwargs` are ignored, allowing the function to be used in an `info_hook`. Note: For pure states (or Hilbert space states), $J_{T,\text{hs}}$ is equivalent to $J_{T,\text{re}}$, cf. :func:`J_T_re`. However, the backward-propagated states $\chi_k$ obtained from the two functionals (:func:`chis_re` and :func:`chis_hs`) are *not* equivalent. This may result in a vastly different optimization landscape that requires a significantly different value of the $\lambda_a$ value that regulates the overall magnitude of the pulse updates (given in `pulse_options` in :func:`.optimize_pulses`). """ if tau_vals is None: tau_vals = [ _overlap(obj.target, psi) for (psi, obj) in zip(fw_states_T, objectives) ] res = 0.0 hs = 'l2' # qutip's name for HS-norm for state vectors if fw_states_T[0].type == 'oper': hs = 'fro' # qutip's name for HS-norm for density matrices for (obj, ρ, τ) in zip(objectives, fw_states_T, tau_vals): ρ_tgt = obj.target if hasattr(obj, 'weight'): res += obj.weight * ( ρ.norm(hs) ** 2 + ρ_tgt.norm(hs) ** 2 - 2 * τ.real ) else: res += ρ.norm(hs) ** 2 + ρ_tgt.norm(hs) ** 2 - 2 * τ.real return res / (2 * len(objectives))
[docs]def chis_hs(fw_states_T, objectives, tau_vals): r"""States $\Op{\chi}_k$ for functional $J_{T,\text{hs}}$ .. math:: \Op{\chi}_k = -\frac{\partial J_{T,\text{sm}}} {\partial \langle\!\langle \Op{\rho}_k(T)\vert} = \frac{1}{2N} w_k \left(\Op{\rho}^{\tgt}_k - \Op{\rho}_k(T)\right) with optional weights $w_k$, cf. :func:`f_tau` (default: :math:`w_k=1`). This is derived from $J_{T,\text{hs}}$ rewritten in the abstract Hilbert-Schmidt notation :math:`\langle\!\langle a \vert b \rangle\!\rangle \equiv \tr[a^\dagger b]`: .. math:: J_{T,\text{hs}} = \frac{-1}{2N} \sum_{k=1}^{N} w_k \big( \underbrace{ \langle\!\langle \Op{\rho}_k(T) \vert \Op{\rho}_k^{\tgt} \rangle\!\rangle + \langle\!\langle \Op{\rho}_k^{\tgt}\vert \Op{\rho}_k(T) \rangle\!\rangle }_{=2\Re[\tau_k]} - \underbrace{ \langle\!\langle \Op{\rho}_k(T) \vert \Op{\rho}_k(T) \rangle\!\rangle }_{=\Norm{\Op{\rho}_k(T)}_{\text{hs}}^2} - \underbrace{ \langle\!\langle \Op{\rho}_k^{\tgt} \vert \Op{\rho}_k^{\tgt} \rangle\!\rangle }_{=\Norm{\Op{\rho}^{\tgt}}_{\text{hs}}^2} \big). Note: `tau_vals` are ignored, but are present to satisfy the requirments of the `chi_constructor` interface. """ c = 1.0 / (2 * len(objectives)) res = [] for (obj, ρ) in zip(objectives, fw_states_T): ρ_tgt = obj.target if hasattr(obj, 'weight'): w = obj.weight res.append(c * w * (ρ_tgt - ρ)) else: res.append(c * (ρ_tgt - ρ)) return res
[docs]def F_avg( fw_states_T, basis_states, gate, mapped_basis_states=None, prec=1e-5 ): r"""Average gate fidelity .. math:: F_{\text{avg}} = \int \big\langle \Psi \big\vert \Op{O}^\dagger \DynMap[\ketbra{\Psi}{\Psi}] \Op{O} \big\vert \Psi \big\rangle \dd \Psi where $\Op{O}$ is the target `gate`, and $\DynMap$ represents the dynamical map from time zero to $T$. In Liouville space, this is numerically evaluated as .. math:: F_{\text{avg}} = \frac{1}{N (N+1)} \sum_{i,j=1}^N \left( \big\langle \phi_i \big\vert \Op{O}^\dagger \Op{\rho}_{ij} \Op{O} \big\vert \phi_j \big\rangle + \big\langle \phi_i \big\vert \Op{O}^\dagger \Op{\rho}_{jj} \Op{O} \big\vert \phi_i \big\rangle \right), where :math:`\ket{\phi_i}` is the :math:`i`'th element of `basis_states`, and :math:`\Op{\rho}_{ij}` is the :math:`(i-1) N + j`'th element of `fw_states_T`, that is, :math:`\Op{\rho}_{ij} = \DynMap[\ketbra{\phi_i}{\phi_j}]`, with :math:`N` the dimension of the Hilbert space. In Hilbert space (unitary dynamics), this simplifies to .. math:: F_{\text{avg}} = \frac{1}{N (N+1)} \left( \Abs{\tr\left[\Op{O}^\dagger \Op{U}\right]}^2 + \tr\left[\Op{O}^\dagger \Op{U} \Op{U}^\dagger \Op{O}\right] \right), where $\Op{U}$ the gate that maps `basis_states` to the result of a forward propagation of those basis states, stored in `fw_states_T`. Args: fw_states_T (list[qutip.Qobj]): The forward propagated states. For dissipative dynamics, this must be the forward propagation of the full basis of Liouville space, that is, all $N^2$ dyadic combinations of the Hilbert space logical basis states. For unitary dynamics, the $N$ forward-propagated `basis_states`. basis_states (list[qutip.Qobj]): The $N$ Hilbert space logical basis states gate (qutip.Qobj): The $N \times N$ quantum gate in the logical subspace, e.g. :func:`qutip.qip.gates.cnot()`. mapped_basis_states (None or list[qutip.Qobj]): If given, the result of applying gate to `basis_states`. If not given, this will be calculated internally via :func:`mapped_basis`. It is recommended to pass pre-calculated `mapped_basis_states` when evaluating $F_{\text{avg}}$ repeatedly for the same target. prec (float): assert that the fidelity is correct at least up to the given precision. Mathematically, $F_{\text{avg}}$ is a real value. However, errors in the `fw_states_T` can lead to a small non-zero imaginary part. We assert that this imaginary part is below `prec`. """ # F_avg is not something you can optimize directly: Nobody has calculated # ∂(1-F_avg)/∂⟨ϕ|. This is why there is no J_T_avg, and why F_avg does not # follow the info_hook interface. N = len(basis_states) if gate.shape != (N, N): raise ValueError( "Shape of gate is incompatible with number of basis states" ) if fw_states_T[0].type == 'oper': if len(fw_states_T) != N * N: raise ValueError( "Evaluating F_avg for density matrices requires %d states " "(forward-propagation of all dyadic combinations of " "%d basis states), not %d" % (N * N, N, len(fw_states_T)) ) return _F_avg_rho( fw_states_T, basis_states, gate, mapped_basis_states, imag_limit=prec, ) elif fw_states_T[0].type == 'ket': if len(fw_states_T) != N: raise ValueError( "Evaluating F_avg for hilbert space states requires %d states " "(forward-propagation of all basis states), not %d" % (N, len(fw_states_T)) ) return _F_avg_psi(fw_states_T, basis_states, gate, imag_limit=prec) else: raise ValueError("Invalid type of state: %s" % fw_states_T[0].type)
def _F_avg_rho( fw_states_T, basis_states, gate, mapped_basis_states, imag_limit=1e-10 ): """Implementation of F_avg in Liouville space""" if mapped_basis_states is None: mapped_basis_states = mapped_basis(gate, basis_states) N = len(basis_states) F = 0 for j in range(N): ρ_jj = fw_states_T[j * N + j] # zero-based indices! Oϕ_j = mapped_basis_states[j] for i in range(N): ρ_ij = fw_states_T[i * N + j] # zero-based indices! Oϕ_i = mapped_basis_states[i] F += _overlap(Oϕ_i, ρ_ij(Oϕ_j)) + _overlap(Oϕ_i, ρ_jj(Oϕ_i)) assert abs(F.imag) < imag_limit, "%.2e > %.2e" % (F.imag, imag_limit) return F.real / (N * (N + 1)) def _F_avg_psi(fw_states_T, basis_states, O, imag_limit=1e-10): """Implementation of F_avg in Hilbert space""" N = len(basis_states) U = gate(basis_states, fw_states_T) F = abs((O.dag() * U).tr()) ** 2 + (O.dag() * U * U.dag() * O).tr() assert abs(F.imag) < imag_limit, "%.2e > %.2e" % (F.imag, imag_limit) return F.real / (N * (N + 1))
[docs]def gate(basis_states, fw_states_T): """Gate that maps `basis_states` to `fw_states_T` Example: >>> from qutip import ket >>> basis = [ket(nums) for nums in [(0, 0), (0, 1), (1, 0), (1, 1)]] >>> fw_states_T = mapped_basis(qutip.gates.cnot(), basis) >>> U = gate(basis, fw_states_T) >>> assert (U - qutip.gates.cnot()).norm() < 1e-15 """ N = len(basis_states) U = np.zeros((N, N), dtype=np.complex128) for j in range(N): for i in range(N): U[i, j] = basis_states[i].overlap(fw_states_T[j]) dims = [basis_states[0].dims[0], fw_states_T[0].dims[0]] return qutip.Qobj(U, dims=dims)
[docs]def mapped_basis(O, basis_states): """Result of applying the gate `O` to `basis_states` Example: >>> from qutip import ket >>> basis = [ket(nums) for nums in [(0, 0), (0, 1), (1, 0), (1, 1)]] >>> states = mapped_basis(qutip.gates.cnot(), basis) >>> assert (states[0] - ket((0, 0))).norm() < 1e-15 >>> assert (states[1] - ket((0, 1))).norm() < 1e-15 >>> assert (states[2] - ket((1, 1))).norm() < 1e-15 # swap (1, 1) ... >>> assert (states[3] - ket((1, 0))).norm() < 1e-15 # ... and (1, 0) """ return tuple( [ sum( [complex(O[i, j]) * basis_states[i] for i in range(O.shape[0])] ) for j in range(O.shape[1]) ] )