Higher-order gradient with the default.mixed device

Hi, I am trying to get the second-order gradient during training. I started with the default.qubit device and it worked properly. However, when I changed it to default.mixed to see the effect of noise on the performance, the output of the second-order gradient calculation is None.

Does anyone know the reason for this and how to fix it? Is it because higher-order gradients are not yet supported on other devices?

Thanks in advance :slight_smile:

Hey @Double_Fan! Is it possible for you to supply your code?

Hey @isaacdevlugt, here is the code. The value of dx2 is None with the default.mixed device:

class Model():
    def __init__(self, n_layers=20, **kwargs):
        super().__init__(**kwargs)
        self.circuit = Circuit()
        self.train_op = tf.keras.optimizers.Adam(learning_rate=0.001)
        self.x_extra = tf.Variable(x_extra, trainable=False)

    def run(self, X):
        return self.circuit(X)

    def get_loss(self, X, Y):
        predicts = self.run(X)
        loss1 = tf.math.reduce_mean(tf.math.square(predicts - Y))

        # Persistent tape so it can be queried twice: once for the first
        # derivative and once more for the second derivative.
        with tf.GradientTape(persistent=True) as tape:
            tape.watch(self.x_extra)
            y_extra = self.run(self.x_extra)
            dx = tape.gradient(y_extra, self.x_extra)   # first-order gradient
            dx2 = tape.gradient(dx, self.x_extra)       # second-order gradient

        return loss1

    def get_grad(self, X, Y):
        with tf.GradientTape(persistent=True) as tape:
            tape.watch(self.circuit.variables)
            L = self.get_loss(X, Y)
            g = tape.gradient(L, self.circuit.variables)
        return g

    def network_learn(self, X, Y):
        g = self.get_grad(X, Y)
        self.train_op.apply_gradients(zip(g, self.circuit.variables))
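
For reference, the dx/dx2 lines above use TensorFlow's persistent-tape approach; the more common nested-tape pattern for a second derivative looks like this (a minimal sketch with a placeholder function, not my actual circuit):

import tensorflow as tf

x = tf.Variable(0.5)
with tf.GradientTape() as outer_tape:
    with tf.GradientTape() as inner_tape:
        y = tf.sin(x)  # placeholder for the circuit output
    dy_dx = inner_tape.gradient(y, x)    # first derivative, recorded by outer_tape
d2y_dx2 = outer_tape.gradient(dy_dx, x)  # second derivative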

It looks like some bits of code that I need to create an instance of the Model class are missing :thinking:. Can you send a complete working example?

Here is an example, in which x, y, and x_extra can be arbitrary values, e.g. all equal to 0.5.

import pennylane as qml
import tensorflow as tf
import numpy as np

dev = qml.device("default.mixed", wires=1)

@qml.qnode(dev, interface="tf")
def qcircuit(params, x):
    qml.Rot(0, x[0], 0, wires=0)
    qml.Rot(params[0], params[1], params[2], wires=0)
    return qml.expval(qml.PauliZ(0))

class Circuit(tf.keras.layers.Layer):
    def __init__(self):
        super(Circuit, self).__init__()
        theta_init = tf.random_uniform_initializer(minval=0.0, maxval=np.pi)
        self.params = tf.Variable(initial_value=theta_init(shape=(3,), dtype="float32"), trainable=True, name="thetas")
      
    def call(self, inputs):
        preds = []
        for i in range(inputs.shape[0]):
            pred = qcircuit(self.params, inputs[i])
            preds.append([pred])
        return tf.convert_to_tensor(preds, dtype=tf.float32)

model = Model()
model.network_learn(x, y)

Are you able to share a minimal example with inputs and outputs along with your exact error message?

For the inputs, you can try the following:

x = np.array([[0.5]])
y = np.array([[0.5]])
x_extra = np.array([[0.5]])

With the default.mixed device, if you print the value of dx2 it is None, but if you change the device to default.qubit you get a real value. I have no idea what the reason for that is.
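
One thing I wondered about (just a guess on my part, not verified): if the QNode falls back to the parameter-shift rule on default.mixed instead of backpropagation, higher-order derivatives may need to be requested explicitly through the max_diff argument, e.g.:

import pennylane as qml

dev = qml.device("default.mixed", wires=1)

# max_diff=2 asks PennyLane to support derivatives up to second order
# when differentiating with the parameter-shift rule.
@qml.qnode(dev, interface="tf", diff_method="parameter-shift", max_diff=2)
def qcircuit(params, x):
    qml.Rot(0, x[0], 0, wires=0)
    qml.Rot(params[0], params[1], params[2], wires=0)
    return qml.expval(qml.PauliZ(0))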

Hey @Double_Fan! I can’t seem to reproduce your error. Here is the code that I’m running and the outputs:

import pennylane as qml
import tensorflow as tf

from pennylane import numpy as np

print(qml.__version__) # 0.24.0 for me
print(tf.__version__) # 2.9.1 for me

dev = qml.device("default.mixed", wires=1)

@qml.qnode(dev, interface="tf")
def qcircuit(params, x):
    qml.Rot(0, x[0], 0, wires=0)
    qml.Rot(params[0], params[1], params[2], wires=0)
    return qml.expval(qml.PauliZ(0))

class Circuit(tf.keras.layers.Layer):
    def __init__(self):
        super(Circuit, self).__init__()
        theta_init = tf.random_uniform_initializer(minval=0.0, maxval=np.pi)
        self.params = tf.Variable(initial_value=theta_init(shape=(3,), dtype="float32"), trainable=True, name="thetas")
      
    def call(self, inputs):
        preds = []
        for i in range(inputs.shape[0]):
            pred = qcircuit(self.params, inputs[i])
            preds.append([pred])
        return tf.convert_to_tensor(preds, dtype=tf.float32)

class Model():
    def __init__(self, n_layers=20, **kwargs):
        super().__init__(**kwargs)
        self.circuit = Circuit()
        self.train_op = tf.keras.optimizers.Adam(learning_rate=0.001)
        self.x_extra = tf.Variable(x_extra, trainable=False)

    def run(self, X):
        return self.circuit(X)

    def get_loss(self, X, Y):
        predicts = self.run(X)
        loss1 = tf.math.reduce_mean(tf.math.square(predicts - Y))

        with tf.GradientTape(persistent=True) as tape:
            tape.watch(self.x_extra)
            y_extra = self.run(self.x_extra)
            dx = tape.gradient(y_extra, self.x_extra)   # first-order gradient
            dx2 = tape.gradient(dx, self.x_extra)       # second-order gradient

        print(dx2)

        return loss1

    def get_grad(self, X, Y):
        with tf.GradientTape(persistent=True) as tape:
            tape.watch(self.circuit.variables)
            L = self.get_loss(X, Y)
            g = tape.gradient(L, self.circuit.variables)
        return g

    def network_learn(self, X, Y):
        g = self.get_grad(X, Y)
        print(g)
        self.train_op.apply_gradients(zip(g, self.circuit.variables))

x = np.array([[0.5]])
y = np.array([[0.5]])
x_extra = np.array([[0.5]])

model = Model()
model.network_learn(x, y)

"""
Outputs:

From print(dx2):

tf.Tensor([[-0.88553823]], shape=(1, 1), dtype=float64) 

From print(g):

[<tf.Tensor: shape=(3,), dtype=float32, numpy=array([ 5.7883937e-02, -1.7684884e-02,  3.4694470e-18], dtype=float32)>]
"""

Hi @isaacdevlugt, thanks a lot :clap:. It works now. I guess it was because of the version of PennyLane I was using.
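
For anyone who lands here with the same issue, it is worth checking the installed version against the one in the working example above (the upgrade command runs in a shell, so it is shown as a comment):

import pennylane as qml
print(qml.__version__)
# If this is older than the version above, upgrading may resolve it:
# pip install --upgrade pennylane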

Awesome! Glad it was an easy fix :slight_smile: