Source code for oqupy.gradient

# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Frontend for computing the gradient of some objective function w.r.t. some
control parameters.
"""
from typing import Callable, Dict, List, Optional, Text, Tuple, Union

import numpy as np
from numpy import ndarray
import tensornetwork as tn

from oqupy.system_dynamics import _compute_dynamics_input_parse, \
    _apply_system_superoperator, _apply_derivative_pt_mpos, _get_pt_mpos, \
    _get_pt_mpos_backprop, _get_caps, _apply_caps, _apply_pt_mpos
from oqupy.control import Control
from oqupy.dynamics import Dynamics
from oqupy.process_tensor import BaseProcessTensor
from oqupy.system import ParameterizedSystem
from oqupy.util import get_progress, check_isinstance

[docs]def state_gradient(
        system: ParameterizedSystem,
        initial_state: ndarray,
        target_derivative: Union[Callable, ndarray],
        process_tensors: List[BaseProcessTensor],
        parameters: ndarray,
        start_time: Optional[float] = 0.0,
        progress_type: Optional[Text] = None) -> Dict:
    """
    Compute system dynamics and gradient of an objective function Z with
    respect to a parameterized System for a given set of control
    parameters, accounting for the interaction with an environment described by
    process tensors. The target state corresponds to (dZ/drho_f).

    Parameters:
    -----------
    system: ParametrizedSystem
        Parameterized system taking M parameters.
    initial_state: ndarray
        The initial density matrix to propagate forwards
    target_derivative: Union[Callable, ndarray]
        A pure target state transposed or derivative w.r.t. an objective
        function.
    process_tensors: List[BaseProcessTensor]
        A list of process tensors (each with N time steps) representing the
        environment.
    parameters: ndarray
        A matrix of dimension 2N x M corresponding to the M parameters at each
        half time step.
    start_time: float
        Optional start time offset.
    progress_type: str (default = None)
        The progress report type during the computation. Types are:
        {``silent``, ``simple``, ``bar``}. If `None` then
        the default progress type is used.

    Returns:
    --------
    return_dict: Dict
        The return dictionary has the fields:
        'final_state' : the final state after evolving the initial state
        'gradprop' : derivatives of Z with respect to half-step propagators
        'gradient' : derivatives of Z with respect to the parameters
        'dynamics' : the dynamics of the system
    """
    check_isinstance(parameters, ndarray, 'parameters')

    num_steps = len(process_tensors[0])
    dt = process_tensors[0].dt
    num_parameters = parameters.shape[1]

    grad_prop, dynamics = compute_gradient_and_dynamics(
        system=system,
        initial_state=initial_state,
        target_derivative=target_derivative,
        process_tensors=process_tensors,
        parameters=parameters,
        start_time=start_time,
        dt=dt,
        num_steps=num_steps,
        progress_type=progress_type)


    get_half_props= system.get_propagators(dt,parameters)
    get_prop_derivatives = system.get_propagator_derivatives(dt,parameters)

    final_derivs = _chain_rule(
        adjoint_tensor=grad_prop,
        dprop_dparam=get_prop_derivatives,
        propagators=get_half_props,
        num_steps=num_steps,
        num_parameters=num_parameters,
        progress_type=progress_type)

    return_dict = {
        'final_state':dynamics.states[-1],
        'gradprop':grad_prop,
        'gradient':final_derivs,
        'dynamics':dynamics
    }

    return return_dict

def _chain_rule(
        adjoint_tensor:ndarray,
        dprop_dparam:Callable[[int], Tuple[ndarray,ndarray]],
        propagators:Callable[[int], Tuple[ndarray,ndarray]],
        num_steps:int,
        num_parameters:int,
        progress_type: Optional[Text] = None):

    def combine_derivs(
            target_deriv,
            pre_prop,
            post_prop):
        target_deriv = tn.Node(target_deriv)
        pre_node=tn.Node(pre_prop)
        post_node=tn.Node(post_prop)
        target_deriv[3] ^ post_node[1]
        target_deriv[2] ^ post_node[0]
        target_deriv[1] ^ pre_node[1]
        target_deriv[0] ^ pre_node[0]

        final_node = target_deriv @ pre_node \
                        @ post_node
        tensor = final_node.tensor

        return tensor

    total_derivs = np.zeros((2*num_steps,num_parameters),dtype='complex128')

    title = "--> Apply chain rule:"
    prog_bar = get_progress(progress_type)(num_steps, title)
    prog_bar.enter()

    for i in range(0,num_steps): # populating two elements each step

        first_half_prop, second_half_prop = propagators(i)
        first_half_prop_derivs,second_half_prop_derivs = dprop_dparam(i)

        prog_bar.update(i)

        for j in range(0,num_parameters):
            total_derivs[2*i][j] = combine_derivs(
                            adjoint_tensor[i],
                            first_half_prop_derivs[j].T,
                            second_half_prop.T)
            total_derivs[2*i+1][j] = combine_derivs(
                adjoint_tensor[i],
                first_half_prop.T,
                second_half_prop_derivs[j].T)

    prog_bar.update(num_steps)
    prog_bar.exit()

    return total_derivs


[docs]def compute_gradient_and_dynamics(
        system: ParameterizedSystem,
        initial_state: ndarray,
        target_derivative: Union[Callable,ndarray],
        process_tensors: List[BaseProcessTensor],
        parameters: ndarray,
        start_time: Optional[float] = 0.0,
        dt: Optional[float] = None,
        num_steps: Optional[int] = None,
        control: Optional[Control] = None,
        record_all: Optional[bool] = True,
        progress_type: Optional[Text] = None) -> Tuple[List, Dynamics]:
    """
    Compute some objective function and calculate its gradient w.r.t.
    some control parameters, accounting for interaction with an environment
    using one or more process tensors.

    Parameters:
    -----------
    system: ParametrizedSystem
        Parameterized system taking M parameters.
    initial_state: ndarray
        The initial density matrix to propagate forwards
    target_derivative: Union[Callable, ndarray]
        A pure target state transposed or derivative w.r.t. an objective
        function.
    process_tensors: List[BaseProcessTensor]
        A list of process tensors (each with N time steps) representing the
        environment.
    parameters: List[Tuple]
        A list of M-tuples with length 2N. Each tuple corresponds to the values
        of the parameters at a given half time step.
    start_time: float
        Optional start time offset.
    dt: float
        Length of a single time step.
    num_steps: int
        Optional number of time steps to be computed.
    control: Control
        Optional control operations.
    record_all: bool
        If `false` function only computes the final state.
    progress_type: str (default = None)
        The progress report type during the computation. Types are:
        {``silent``, ``simple``, ``bar``}. If `None` then
        the default progress type is used.

    Returns:
    --------
    propagator_derivatives: List[ndarray]
        List of 4-rank tensors. The nth entry corresponds to the derivative of
        the objective function with respect to a propagator at the nth
        time step. The axis are ordered as follows:
            * [0] : output leg of 2nd half-propagator from step (n-1)
            * [1] : input system leg of MPO from step n
            * [2] : output system leg of MPO from step n
            * [3] : input lef of 1st half-propagator from step (n+1)
    dynamics: Dynamics
        The system dynamics for the given system Hamiltonian
        (accounting for the interaction with the environment).
    """

    # -- input parsing --
    parsed_parameters = _compute_dynamics_input_parse(
        False, system, initial_state, dt, num_steps, start_time,
        process_tensors, control, record_all)
    system, initial_state, dt, num_steps, start_time, \
        process_tensors, control, record_all, hs_dim = parsed_parameters

    check_isinstance(system, ParameterizedSystem, "system")

    assert target_derivative is not None, \
        'target state must be given explicitly'

    num_envs = len(process_tensors)

    # -- prepare propagators --
    propagators = system.get_propagators(dt, parameters)

    # -- prepare controls --
    def controls(step: int):
        return control.get_controls(
            step,
            dt=dt,
            start_time=start_time)

    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # ~~~~ Forwardpropagation ~~~~
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~

    # -- initialize computation --
    #
    #  Initial state including the bond legs to the environments with:
    #    edges 0, 1, .., num_envs-1    are the bond legs of the environments
    #    edge  -1                      is the state leg
    initial_ndarray = initial_state.reshape(hs_dim**2)
    initial_ndarray.shape = tuple([1]*num_envs+[hs_dim**2])
    current_node = tn.Node(initial_ndarray)
    current_edges = current_node[:]

    states = []
    title = "--> Compute forward propagation:"
    prog_bar = get_progress(progress_type)(num_steps, title)
    prog_bar.enter()

    forwardprop_derivs_list = []
    mpo_list=[]

    for step in range(num_steps+1):

        # -- apply pre measurement control --
        pre_measurement_control, post_measurement_control = controls(step)

        if pre_measurement_control is not None:
            current_node, current_edges = _apply_system_superoperator(
                current_node, current_edges, pre_measurement_control)

        if step == num_steps:
            break

        # -- extract current state -- update field --
        if record_all:
            caps = _get_caps(process_tensors, step)
            state_tensor = _apply_caps(current_node, current_edges, caps)
            state = state_tensor.reshape(hs_dim, hs_dim)
            states.append(state)

        prog_bar.update(step)

        # -- apply post measurement control --
        if post_measurement_control is not None:
            current_node, current_edges = _apply_system_superoperator(
                current_node, current_edges, post_measurement_control)

        forwardprop_derivs_list.append(tn.replicate_nodes([current_node])[0])

        # -- propagate one time step --
        first_half_prop, second_half_prop = propagators(step)

        pt_mpos = _get_pt_mpos(process_tensors, step)
        mpo_list.append(pt_mpos)

        current_node, current_edges = _apply_system_superoperator(
            current_node, current_edges, first_half_prop)
        current_node, current_edges = _apply_pt_mpos(
            current_node, current_edges, pt_mpos)

        current_node, current_edges = _apply_system_superoperator(
            current_node, current_edges, second_half_prop)

    # -- extract last state --
    caps = _get_caps(process_tensors, num_steps)
    state_tensor = _apply_caps(current_node, current_edges, caps)
    final_state = state_tensor.reshape(hs_dim, hs_dim)
    states.append(final_state)

    prog_bar.update(num_steps)
    prog_bar.exit()

    # -- create dynamics object --
    if record_all:
        times = start_time + np.arange(len(states))*dt
    else:
        times = [start_time + len(states)*dt]

    dynamics = Dynamics(times=list(times),states=states)

    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~
    # ~~~~~ Backpropagation ~~~~~~
    # ~~~~~~~~~~~~~~~~~~~~~~~~~~~~

    # -- initialize computation (except backwards) --
    #
    #  Initial state including the bond legs to the environments with:
    #    edges 0, 1, .., num_envs-1    are the bond legs of the environments
    #    edge  -1                      is the state leg

    title = "--> Compute backward propagation:"
    prog_bar = get_progress(progress_type)(num_steps, title)
    prog_bar.enter()

    if callable(target_derivative):
        target_derivative=target_derivative(states[-1])


    target_ndarray = target_derivative
    target_ndarray = target_ndarray.reshape(hs_dim**2)
    target_ndarray.shape = tuple([1]*num_envs+[hs_dim**2])
    current_node = tn.Node(target_ndarray)
    current_edges = current_node[:]

    combined_deriv_list = []

    pre_measurement_control, post_measurement_control=controls(num_steps)

    if pre_measurement_control is not None:
        current_node, current_edges = _apply_system_superoperator(
                current_node, current_edges, pre_measurement_control.T)

    forwardprop_tensor = forwardprop_derivs_list[num_steps-1]

    pt_mpos = mpo_list[num_steps-1]
    backprop_tensor = tn.replicate_nodes([current_node])[0]

    fwd_edges = forwardprop_tensor[:]
    deriv_forwardprop_tensor, fwd_edges = _apply_derivative_pt_mpos(
        forwardprop_tensor,fwd_edges,pt_mpos)

    for i, _ in enumerate(pt_mpos):
        fwd_edges[i] ^ backprop_tensor[i]

    deriv = deriv_forwardprop_tensor @ backprop_tensor

    combined_deriv_list.append(tn.replicate_nodes([deriv])[0])

    for loop, step in enumerate(reversed(range(1,num_steps))):

        prog_bar.update(loop)

        # -- now the backpropagation part --
        pre_measurement_control, post_measurement_control = controls(step)
        first_half_prop, second_half_prop = propagators(step)
        pt_mpos = _get_pt_mpos_backprop(mpo_list, step)

        current_node, current_edges = _apply_system_superoperator(
            current_node, current_edges, second_half_prop.T)

        current_node, current_edges = _apply_pt_mpos(
            current_node, current_edges, pt_mpos)

        current_node, current_edges = _apply_system_superoperator(
            current_node, current_edges, first_half_prop.T)

        if post_measurement_control is not None:
            current_node, current_edges = _apply_system_superoperator(
                current_node, current_edges, post_measurement_control.T)

        if pre_measurement_control is not None:
            current_node, current_edges = _apply_system_superoperator(
                current_node, current_edges, pre_measurement_control.T)

        forwardprop_tensor = forwardprop_derivs_list[step-1]

        backprop_tensor =  tn.replicate_nodes([current_node])[0]

        pt_mpos = mpo_list[step-1]

        fwd_edges = forwardprop_tensor[:]
        deriv_forwardprop_tensor,fwd_edges = _apply_derivative_pt_mpos(
            forwardprop_tensor,fwd_edges,pt_mpos)

        for i, _ in enumerate(pt_mpos):
            fwd_edges[i] ^ backprop_tensor[i]

        deriv = deriv_forwardprop_tensor @ backprop_tensor

        combined_deriv_list.append(deriv.get_tensor())
        # ordering of axis:
        # deriv[0] : output leg of 2nd half-propagator from step (n-1)
        # deriv[1] : input system leg of MPO from step n
        # deriv[2] : output system leg of MPO from step n
        # deriv[3] : input lef of 1st half-propagator from step (n+1)

    propagator_derivatives = list(reversed(combined_deriv_list))

    prog_bar.update(num_steps)
    prog_bar.exit()

    return propagator_derivatives, dynamics