# Source code for pennylane.gradients.adjoint_metric_tensor

# Copyright 2018-2021 Xanadu Quantum Technologies Inc.

# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at

#     http://www.apache.org/licenses/LICENSE-2.0

# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
Contains the adjoint_metric_tensor.
"""
from functools import partial
from itertools import chain

import numpy as np

import pennylane as qml

# pylint: disable=too-many-statements,unused-argument
from pennylane.gradients.metric_tensor import _contract_metric_tensor_with_cjac
from pennylane.tape import QuantumScript, QuantumScriptBatch
from pennylane.transforms import transform
from pennylane.typing import PostprocessingFn


def _reshape_real_imag(state, dim):
    """Reshape ``state`` to shape ``(dim,)`` and return its real and imaginary parts
    as a ``(real, imag)`` pair."""
    flat_state = qml.math.reshape(state, (dim,))
    real_part = qml.math.real(flat_state)
    imag_part = qml.math.imag(flat_state)
    return real_part, imag_part


def _group_operations(tape):
    """Divide all operations of a tape into trainable operations and blocks
    of untrainable operations after each trainable one."""

    # Extract tape operations list
    ops = tape.operations
    # Find the indices of trainable operations in the tape operations list
    # pylint: disable=protected-access
    trainable_par_info = [tape.par_info[i] for i in tape.trainable_params]
    trainables = [info["op_idx"] for info in trainable_par_info]
    # Add the indices incremented by one to the trainable indices
    split_ids = list(chain.from_iterable([idx, idx + 1] for idx in trainables))

    # Split at trainable and incremented indices to get groups after trainable
    # operations and single trainable operations (in alternating order)
    all_groups = np.split(ops, split_ids)

    # Collect trainable operations and groups after trainable operations
    # the first set of non-trainable ops are the ops "after the -1st" trainable op
    group_after_trainable_op = dict(enumerate(all_groups[::2], start=-1))
    trainable_operations = list(chain.from_iterable(all_groups[1::2]))

    return trainable_operations, group_after_trainable_op


def _expand_trainable_multipar(
    tape: QuantumScript,
) -> tuple[QuantumScriptBatch, PostprocessingFn]:
    """Expand the trainable multi-parameter operations of a quantum tape.

    Returns a one-element batch holding the expanded tape, together with a
    postprocessing function that returns the first entry of its argument.
    """
    parameters = tape.get_parameters()
    # The tape-level argnum is only requested when the parameters use the JAX interface.
    is_jax = qml.math.get_interface(*parameters) == "jax"
    expander = qml.transforms.create_expand_trainable_multipar(tape, use_tape_argnum=is_jax)

    def _take_first(results):
        return results[0]

    return [expander(tape)], _take_first


@partial(
    transform,
    expand_transform=_expand_trainable_multipar,
    classical_cotransform=_contract_metric_tensor_with_cjac,
    is_informative=True,
    use_argnum_in_expand=True,
)
def adjoint_metric_tensor(
    tape: QuantumScript,
) -> tuple[QuantumScriptBatch, PostprocessingFn]:
    r"""Implements the adjoint method outlined in
    `Jones <https://arxiv.org/abs/2011.02991>`__ to compute the metric tensor.

    A forward pass followed by intermediate partial backwards passes are
    used to evaluate the metric tensor in :math:`\mathcal{O}(p^2)` operations,
    where :math:`p` is the number of trainable operations, using 4 state
    vectors.

    .. note::
        The adjoint metric tensor method has the following restrictions:

        * Currently only ``"default.qubit"`` with ``shots=None`` is supported.

        * We assume the circuit to be composed of unitary gates only and rely
          on the ``generator`` property of the gates to be implemented.
          Note also that this makes the metric tensor strictly real-valued.

    Args:
        tape (QNode or QuantumTape): Circuit to compute the metric tensor of

    Returns:
        qnode (QNode) or tuple[List[QuantumTape], function]:

        The transformed circuit as described in :func:`qml.transform <pennylane.transform>`.
        Executing this circuit will provide the metric tensor in the form of a tensor.
        Dimensions are ``(tape.num_params, tape.num_params)``.

    .. seealso:: :func:`~.metric_tensor` for hardware-compatible metric tensor computations.

    **Example**

    Consider the following QNode:

    .. code-block:: python

        dev = qml.device("default.qubit", wires=3)

        @qml.qnode(dev, interface="autograd")
        def circuit(weights):
            qml.RX(weights[0], wires=0)
            qml.RY(weights[1], wires=0)
            qml.CNOT(wires=[0, 1])
            qml.RZ(weights[2], wires=1)
            qml.RZ(weights[3], wires=0)
            return qml.expval(qml.Z(0) @ qml.Z(1)), qml.expval(qml.Y(1))

    We can use the ``adjoint_metric_tensor`` transform to generate a new function
    that returns the metric tensor of this QNode:

    >>> mt_fn = qml.adjoint_metric_tensor(circuit)
    >>> weights = np.array([0.1, 0.2, 0.4, 0.5], requires_grad=True)
    >>> mt_fn(weights)
    tensor([[ 0.25  ,  0.    , -0.0497, -0.0497],
            [ 0.    ,  0.2475,  0.0243,  0.0243],
            [-0.0497,  0.0243,  0.0123,  0.0123],
            [-0.0497,  0.0243,  0.0123,  0.0123]], requires_grad=True)

    This approach has the benefit of being significantly faster than the hardware-ready
    ``metric_tensor`` function:

    >>> import time
    >>> start_time = time.process_time()
    >>> mt = mt_fn(weights)
    >>> time.process_time() - start_time
    0.019
    >>> mt_fn_2 = qml.metric_tensor(circuit)
    >>> start_time = time.process_time()
    >>> mt = mt_fn_2(weights)
    >>> time.process_time() - start_time
    0.025

    This speedup becomes more drastic for larger circuits.
    The drawback of the adjoint method is that it is only available on simulators and without
    shot simulations.
    """

    def processing_fn(tapes):
        """Compute the metric tensor from the first tape in ``tapes``.

        The state vectors are propagated here with the ``qml.devices.qubit``
        helpers ``create_initial_state`` and ``apply_operation``.

        Raises:
            ValueError: if the tape has shots set.
        """
        tape = tapes[0]
        if tape.shots:
            raise ValueError(
                "The adjoint method for the metric tensor is only implemented for shots=None"
            )
        # Relabel the wires to the consecutive integers 0, ..., num_wires - 1 if needed
        if set(tape.wires) != set(range(tape.num_wires)):
            wire_map = {w: i for i, w in enumerate(tape.wires)}
            tapes, fn = qml.map_wires(tape, wire_map)
            tape = fn(tapes)

        # Divide all operations of a tape into trainable operations and blocks
        # of untrainable operations after each trainable one.
        trainable_operations, group_after_trainable_op = _group_operations(tape)

        dim = 2**tape.num_wires
        # generate and extract initial state
        prep = tape[0] if len(tape) > 0 and isinstance(tape[0], qml.operation.StatePrep) else None

        interface = qml.math.get_interface(*tape.get_parameters(trainable_only=False))
        psi = qml.devices.qubit.create_initial_state(tape.wires, prep, like=interface)

        # initialize metric tensor components (which all will be real-valued)
        like_real = qml.math.real(psi[0])
        L = qml.math.convert_like(qml.math.zeros((tape.num_params, tape.num_params)), like_real)
        T = qml.math.convert_like(qml.math.zeros((tape.num_params,)), like_real)

        # apply the operations before the first trainable one; a leading state
        # preparation is skipped as it already entered the initial state above
        for op in group_after_trainable_op[-1][int(prep is not None) :]:
            psi = qml.devices.qubit.apply_operation(op, psi)

        for j, outer_op in enumerate(trainable_operations):
            generator_1, prefactor_1 = qml.generator(outer_op)

            # the state vector phi is missing a factor of 1j * prefactor_1
            phi = qml.devices.qubit.apply_operation(generator_1, psi)

            phi_real, phi_imag = _reshape_real_imag(phi, dim)
            diag_value = prefactor_1**2 * (
                qml.math.dot(phi_real, phi_real) + qml.math.dot(phi_imag, phi_imag)
            )
            L = qml.math.scatter_element_add(L, (j, j), diag_value)

            lam = psi * 1.0
            lam_real, lam_imag = _reshape_real_imag(lam, dim)

            # this entry is missing a factor of 1j
            value = prefactor_1 * (
                qml.math.dot(lam_real, phi_real) + qml.math.dot(lam_imag, phi_imag)
            )
            T = qml.math.scatter_element_add(T, (j,), value)

            for i in range(j - 1, -1, -1):
                # after first iteration of inner loop: apply U_{i+1}^\dagger
                if i < j - 1:
                    phi = qml.devices.qubit.apply_operation(
                        qml.adjoint(trainable_operations[i + 1], lazy=False), phi
                    )
                # apply V_{i}^\dagger
                for op in reversed(group_after_trainable_op[i]):
                    adj_op = qml.adjoint(op, lazy=False)
                    phi = qml.devices.qubit.apply_operation(adj_op, phi)
                    lam = qml.devices.qubit.apply_operation(adj_op, lam)

                inner_op = trainable_operations[i]
                # extract and apply G_i
                generator_2, prefactor_2 = qml.generator(inner_op)
                # this state vector is missing a factor of 1j * prefactor_2
                mu = qml.devices.qubit.apply_operation(generator_2, lam)

                phi_real, phi_imag = _reshape_real_imag(phi, dim)
                mu_real, mu_imag = _reshape_real_imag(mu, dim)
                # this entry is missing a factor of 1j * (-1j) = 1, i.e. none
                value = (
                    prefactor_1
                    * prefactor_2
                    * (qml.math.dot(mu_real, phi_real) + qml.math.dot(mu_imag, phi_imag))
                )
                # write the same value to both (i, j) and (j, i)
                L = qml.math.scatter_element_add(
                    L, [(i, j), (j, i)], value * qml.math.convert_like(qml.math.ones((2,)), value)
                )
                # apply U_i^\dagger
                lam = qml.devices.qubit.apply_operation(qml.adjoint(inner_op, lazy=False), lam)

            # apply U_j and V_j
            psi = qml.devices.qubit.apply_operation(outer_op, psi)
            for op in group_after_trainable_op[j]:
                psi = qml.devices.qubit.apply_operation(op, psi)

        # postprocessing: combine L and T into the metric tensor.
        # We require outer(conj(T), T) here, but as we skipped the factor 1j above,
        # the stored T is real-valued. Thus we have -1j*1j*outer(T, T) = outer(T, T)
        metric_tensor = L - qml.math.tensordot(T, T, 0)

        return metric_tensor

    return [tape], processing_fn