Source code for qiskit_algorithms.gradients.reverse.reverse_qgt

# This code is part of a Qiskit project.
#
# (C) Copyright IBM 2023.
#
# This code is licensed under the Apache License, Version 2.0. You may
# obtain a copy of this license in the LICENSE.txt file in the root directory
# of this source tree or at http://www.apache.org/licenses/LICENSE-2.0.
#
# Any modifications or derivative works of this code must retain this
# copyright notice, and modified files need to carry a notice indicating
# that they have been altered from the originals.

"""QGT with the classically efficient reverse mode."""

from __future__ import annotations
from collections.abc import Sequence
from typing import cast, List
import logging

import numpy as np

from qiskit.circuit import QuantumCircuit, Parameter
from qiskit.quantum_info import Statevector
from qiskit.providers import Options
from qiskit.primitives import Estimator

from ..base.base_qgt import BaseQGT
from ..base.qgt_result import QGTResult
from ..utils import DerivativeType

from .split_circuits import split
from .bind import bind
from .derive_circuit import derive_circuit

logger = logging.getLogger(__name__)


[docs]class ReverseQGT(BaseQGT): """QGT calculation with the classically efficient reverse mode. .. note:: This QGT implementation is based on statevector manipulations and scales exponentially with the number of qubits. However, for small system sizes it can be very fast compared to circuit-based gradients. This class implements the calculation of the QGT as described in [1]. By keeping track of three statevectors and iteratively sweeping through each parameterized gate, this method scales only quadratically with the number of parameters. **References:** [1]: Jones, T. "Efficient classical calculation of the Quantum Natural Gradient" (2020). `arXiv:2011.02991 <https://arxiv.org/abs/2011.02991>`_. """ SUPPORTED_GATES = ["rx", "ry", "rz", "cp", "crx", "cry", "crz"] def __init__( self, phase_fix: bool = True, derivative_type: DerivativeType = DerivativeType.COMPLEX ): """ Args: phase_fix: Whether or not to include the phase fix. derivative_type: Determines whether the complex QGT or only the real or imaginary parts are calculated. """ dummy_estimator = Estimator() # this method does not need an estimator super().__init__(dummy_estimator, phase_fix, derivative_type) @property def options(self) -> Options: """There are no options for the reverse QGT, returns an empty options dict. Returns: Empty options. """ return Options() def _run( # pylint: disable=arguments-renamed self, circuits: Sequence[QuantumCircuit], parameter_values: Sequence[Sequence[float]], parameters: Sequence[Sequence[Parameter]], **options, ) -> QGTResult: """Compute the QGT on the given circuits.""" g_circuits, g_parameter_values, g_parameter_sets = self._preprocess( circuits, parameter_values, parameters, self.SUPPORTED_GATES ) results = self._run_unique(g_circuits, g_parameter_values, g_parameter_sets, **options) return self._postprocess(results, circuits, parameter_values, parameters) def _run_unique( self, circuits: Sequence[QuantumCircuit], parameter_values: Sequence[Sequence[float]], parameter_sets: Sequence[Sequence[Parameter]], **options, # pylint: disable=unused-argument ) -> QGTResult: num_qgts = len(circuits) qgts = [] metadata = [] for k in range(num_qgts): values = np.asarray(parameter_values[k]) circuit = circuits[k] parameters = list(parameter_sets[k]) num_parameters = len(parameters) original_parameter_order = [p for p in circuit.parameters if p in parameters] metadata.append({"parameters": original_parameter_order}) unitaries, paramlist = split(circuit, parameters=parameters) # initialize the phase fix vector and the hessian part ``metric`` num_parameters = len(unitaries) phase_fixes = np.zeros(num_parameters, dtype=complex) metric = np.zeros((num_parameters, num_parameters), dtype=complex) # initialize the state variables -- naming convention is the same as the paper parameter_binds = dict(zip(circuit.parameters, values)) bound_unitaries = cast(List[QuantumCircuit], bind(unitaries, parameter_binds)) chi = Statevector(bound_unitaries[0]) psi = chi.copy() phi = Statevector.from_int(0, (2,) * circuit.num_qubits) # Get the analytic gradient of the first unitary # Note: We currently only support gates with a single parameter -- which is reflected # in self.SUPPORTED_GATES -- but generally we could also support gates with multiple # parameters per gate. This is the reason for the second 0-index. deriv = derive_circuit(unitaries[0], paramlist[0][0]) for _, gate in deriv: bind(gate, parameter_binds, inplace=True) grad_coeffs = [coeff for coeff, _ in deriv] grad_states = [phi.evolve(gate) for _, gate in deriv] # compute phase fix (optional) and the hessian part if self._phase_fix: phase_fixes[0] = _phasefix_term(chi, grad_coeffs, grad_states) metric[0, 0] = _l_term(grad_coeffs, grad_states, grad_coeffs, grad_states) for j in range(1, num_parameters): lam = psi.copy() phi = psi.copy() # get the analytic gradient d U_j / d p_j and apply it deriv = derive_circuit(unitaries[j], paramlist[j][0]) for _, gate in deriv: bind(gate, parameter_binds, inplace=True) # compute |phi> (in general it's a sum of states and coeffs) grad_coeffs = [coeff for coeff, _ in deriv] grad_states = [phi.evolve(gate) for _, gate in deriv] # compute the diagonal element L_{j, j} metric[j, j] += _l_term(grad_coeffs, grad_states, grad_coeffs, grad_states) # compute the off diagonal elements L_{i, j} for i in reversed(range(j)): # apply U_{i + 1}_dg unitary_ip_inv = bound_unitaries[i + 1].inverse() grad_states = [state.evolve(unitary_ip_inv) for state in grad_states] lam = lam.evolve(bound_unitaries[i].inverse()) # get the gradient d U_i / d p_i and apply it deriv = derive_circuit(unitaries[i], paramlist[i][0]) for _, gate in deriv: bind(gate, parameter_binds, inplace=True) grad_coeffs_mu = [coeff for coeff, _ in deriv] grad_states_mu = [lam.evolve(gate) for _, gate in deriv] metric[i, j] += _l_term( grad_coeffs_mu, grad_states_mu, grad_coeffs, grad_states ) if self._phase_fix: phase_fixes[j] += _phasefix_term(chi, grad_coeffs, grad_states) psi = psi.evolve(bound_unitaries[j]) # The following code stacks the QGT together and maps the values into the # correct original order of parameters # map circuit parameter to global index in the circuit param_to_circuit = { param: index for index, param in enumerate(original_parameter_order) } # map global index to the local index used in the calculation, the new index can # now be accessed by remap[index] remap = { index: param_to_circuit[_extract_parameter(plist[0])] for index, plist in enumerate(paramlist) } qgt = np.zeros((num_parameters, num_parameters), dtype=complex) for i in range(num_parameters): iloc = remap[i] for j in range(num_parameters): jloc = remap[j] if i <= j: qgt[iloc, jloc] += metric[i, j] else: qgt[iloc, jloc] += np.conj(metric[j, i]) qgt[iloc, jloc] -= np.conj(phase_fixes[i]) * phase_fixes[j] # append and cast to real/imag if required qgts.append(self._to_derivtype(qgt)) result = QGTResult(qgts, self.derivative_type, metadata, options=None) return result def _to_derivtype(self, qgt): if self.derivative_type == DerivativeType.REAL: return np.real(qgt) if self.derivative_type == DerivativeType.IMAG: return np.imag(qgt) return qgt
def _l_term(coeffs_i, states_i, coeffs_j, states_j): return sum( sum( np.conj(coeff_i) * coeff_j * np.conj(state_i.data).dot(state_j.data) for coeff_i, state_i in zip(coeffs_i, states_i) ) for coeff_j, state_j in zip(coeffs_j, states_j) ) def _phasefix_term(chi, coeffs, states): return sum( coeff_i * np.conj(chi.data).dot(state_i.data) for coeff_i, state_i in zip(coeffs, states) ) def _extract_parameter(expression): if isinstance(expression, Parameter): return expression if len(expression.parameters) > 1: raise ValueError("Expression has more than one parameter.") return list(expression.parameters)[0]