Barren Plateaus¶
Copyright (c) 2021 Institute for Quantum Computing, Baidu Inc. All Rights Reserved.
Overview¶
In the training of classical neural networks, gradient-based optimization methods encounter the problem of local minima and saddle points. Correspondingly, the barren plateau phenomenon can block us from efficiently training quantum neural networks. This peculiar phenomenon was first discovered by McClean et al. in 2018 [1]. In short, when the randomly initialized parameterized circuit reaches a certain degree of complexity, the optimization landscape becomes very flat, which makes it difficult for gradient-descent-based methods to find the global minimum. For most variational quantum algorithms (VQE, etc.), this phenomenon means that as the number of qubits increases, randomly choosing a circuit ansatz and randomly initializing its parameters may not be a good idea: the optimization landscape corresponding to the loss function turns into a huge plateau, which makes the training of the QNN much more difficult. The initial random point of the optimization is very likely to fall inside this plateau, and the convergence time of gradient descent is prolonged.
The figure is generated through Gradient Descent Viz
Given the impact of gradient behavior on the training of such variational quantum algorithms, we provide a gradient analysis tool module in Paddle Quantum to assist users in diagnosing models and to facilitate the study of problems such as barren plateaus.
This tutorial mainly discusses how to demonstrate the barren plateau phenomenon with Paddle Quantum and how to use the gradient analysis tool to analyze the parameter gradients in user-defined quantum neural networks. Although it does not involve any algorithmic innovation, it can help readers understand gradient-based training of QNNs.
We first import the necessary libraries and packages:
# Ignore warnings
import warnings
warnings.filterwarnings("ignore")
# Import packages needed
import time
import numpy as np
from math import pi
import paddle
from paddle_quantum.ansatz import Circuit
from paddle_quantum.linalg import dagger
from paddle_quantum.loss import ExpecVal
from paddle_quantum.state import zero_state
# Drawing tools
from matplotlib import pyplot as plt
Random network structure¶
Here we follow the original method mentioned in the paper by McClean (2018) [1] and build the following random circuit:
First, we rotate all the qubits around the $y$-axis of the Bloch sphere with rotation gates $R_y(\pi/4)$.
The remaining structure consists of repeated blocks, and each block can be further divided into two layers:
- The first layer is a set of random rotation gates on all the qubits, where $R_{\ell,n} \in \{R_x, R_y, R_z\}$. The subscript $\ell$ means the gate is in the $\ell$-th repeated block. In the figure above, $\ell =1$. The second subscript $n$ indicates which qubit it acts on.
- The second layer is composed of CZ gates, which act on adjacent qubits.
In Paddle Quantum, we can build this circuit with the following code:
def rand_circuit(target, num_qubits, theta=None):
# Initialize the quantum circuit
cir = Circuit(num_qubits)
# Fixed-angle Ry rotation gates
cir.ry(param=pi / 4)
# ============== First layer ==============
    # Randomly choose a rotation gate Rx, Ry, or Rz for each qubit
for i in range(num_qubits):
if target[i] == 0:
cir.rz(i, param=theta[i] if theta is not None else theta)
elif target[i] == 1:
cir.ry(i, param=theta[i] if theta is not None else theta)
else:
cir.rx(i, param=theta[i] if theta is not None else theta)
# ============== Second layer ==============
# Build adjacent CZ gates
for i in range(num_qubits - 1):
cir.cz([i, i + 1])
return cir
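As a quick check (this snippet is an addition, not part of the original notebook), we can draw one random two-qubit instance of this ansatz; with theta=None the rotation angles are initialized randomly by Paddle Quantum:
# Draw one random instance of the ansatz (example_target is a name introduced here)
example_target = np.random.choice(3, 2)  # randomly pick Rz/Ry/Rx for each of the 2 qubits
print(rand_circuit(example_target, 2))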
Loss function and optimization landscape¶
After determining the circuit structure, we also need to define a loss function to determine the optimization landscape. Following the same setup as McClean (2018) [1], we take the loss function from VQE:
$$ \mathcal{L}(\boldsymbol{\theta})= \langle0| U^{\dagger}(\boldsymbol{\theta})H U(\boldsymbol{\theta}) |0\rangle. \tag{1} $$
The unitary matrix $U(\boldsymbol{\theta})$ is the quantum neural network with the random structure that we built in the last section. For the Hamiltonian $H$, we also take the simplest form $H = |00\cdots 0\rangle\langle00\cdots 0|$. After that, we can start sampling gradients in the two-qubit case: generate 300 sets of random network structures and different random initial parameters $\{\theta_{\ell,n}^{(i)}\}_{i=1}^{300}$. Each time, the partial derivative with respect to the first parameter $\theta_{1,1}$ is calculated according to the analytical gradient formula from VQE. Then we analyze the mean and variance of these 300 sampled partial derivatives. The formula for the analytical gradient is:
$$ \partial \theta_{j} \equiv \frac{\partial \mathcal{L}}{\partial \theta_j} = \frac{1}{2} \big[\mathcal{L}(\theta_j + \frac{\pi}{2}) - \mathcal{L}(\theta_j - \frac{\pi}{2})\big]. \tag{2} $$
For a detailed derivation, see arXiv:1803.00745.
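Before sampling with Paddle Quantum, Eq. (2) can be verified on a toy example. The following NumPy-only sketch (an addition to the tutorial; toy_loss is a name introduced here) compares the parameter-shift gradient with a finite-difference estimate for a single $R_y$ gate and $H = |0\rangle\langle0|$, where the loss reduces to $\cos^2(\theta/2)$:
# Minimal check of Eq. (2): for L(theta) = |<0|Ry(theta)|0>|^2 = cos^2(theta/2),
# the parameter-shift value matches a finite-difference estimate.
def toy_loss(theta):
    return np.cos(theta / 2) ** 2

theta = 0.7
shift_grad = (toy_loss(theta + np.pi / 2) - toy_loss(theta - np.pi / 2)) / 2
finite_diff = (toy_loss(theta + 1e-6) - toy_loss(theta - 1e-6)) / 2e-6
print(shift_grad, finite_diff)  # both approximately equal -sin(theta)/2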
# Hyper parameter settings
# np.random.seed(42) # Fixed Numpy random seed
N = 2 # Set the number of qubits
samples = 300 # Set the number of sampled random network structures
THETA_SIZE = N # Set the size of the parameter theta
ITR = 1 # Set the number of iterations
LR = 0.2 # Set the learning rate
SEED = 1 # Fixed the randomly initialized seed in the optimizer
# Initialize the register for the gradient value
grad_info = []
# paddle.seed(SEED)
class manual_gradient(paddle.nn.Layer):
    # The constructor only stores the Hamiltonian; the circuit parameters are sampled afresh in forward()
def __init__(self, shape, param_attr=paddle.nn.initializer.Uniform(low=0.0, high=2*pi), dtype='float32'):
super(manual_gradient, self).__init__()
        # Store the zero state, which serves as the Hamiltonian H = |00...0><00...0| in the loss
        self.H = zero_state(N).data
# Define loss function and forward propagation mechanism
def forward(self):
# Initialize three theta parameter lists
theta_np = np.random.uniform(low=0., high=2*pi, size=(THETA_SIZE))
theta_plus_np = np.copy(theta_np)
theta_minus_np = np.copy(theta_np)
        # Shift the first parameter by +pi/2 and -pi/2 for the parameter-shift gradient
theta_plus_np[0] += np.pi/2
theta_minus_np[0] -= np.pi/2
# Convert Numpy array to Tensor in PaddlePaddle
theta_plus = paddle.to_tensor(theta_plus_np)
theta_minus = paddle.to_tensor(theta_minus_np)
# Generate random targets, randomly select circuit gates in rand_circuit
target = np.random.choice(3, N)
U_plus = rand_circuit(target, N, theta_plus).unitary_matrix()
U_minus = rand_circuit(target, N, theta_minus).unitary_matrix()
# Calculate the analytical gradient
grad = paddle.real((dagger(U_plus) @ self.H @ U_plus)[0][0] - (dagger(U_minus) @ self.H @ U_minus)[0][0])/2
return grad
# Define the main block
def main():
    # Instantiate the gradient sampler
sampling = manual_gradient(shape=[THETA_SIZE])
# Sampling to obtain gradient information
grad = sampling().numpy()
return grad
# Record running time
time_start = time.time()
# Start sampling
if __name__ == '__main__':
    for i in range(samples):
        grad = main()
        grad_info.append(grad)
time_span = time.time() - time_start
print('The main program segment has run in total ', time_span, ' seconds')
print("Use ", samples, " samples to get the mean value of the gradient of the random network's first parameter, and we have:", np.mean(grad_info))
print("Use ", samples, "samples to get the variance of the gradient of the random network's first parameter, and we have:", np.var(grad_info))
The main program segment has run in total 2.2558279037475586 seconds
Use 300 samples to get the mean value of the gradient of the random network's first parameter, and we have: -0.0032896693
Use 300 samples to get the variance of the gradient of the random network's first parameter, and we have: 0.098623686
Visualization of the Optimization Landscape¶
Next, we use Matplotlib to visualize the optimization landscape. In the case of two qubits, we only have two parameters $\theta_1$ and $\theta_2$, and there are 9 possibilities for the random circuit structure in the second layer.
The flat landscape shown for the $R_z$-$R_z$ structure in the last figure is something we should avoid: in this case, it is nearly impossible to converge to the theoretical minimum. If you want to try drawing some optimization landscapes yourself, please refer to the following code:
time_start = time.time()
N = 2
# Set the image ratio Vertical: Horizontal = 0.3
fig = plt.figure(figsize=plt.figaspect(0.3))
# Generate points on the x, y axis
X = np.linspace(0, 2 * np.pi, 80)
Y = np.linspace(0, 2 * np.pi, 80)
# Generate 2D mesh
xx, yy = np.meshgrid(X, Y)
# Define the necessary logic gates
def rx(theta):
mat = np.array([[np.cos(theta/2), -1j * np.sin(theta/2)],
[-1j * np.sin(theta/2), np.cos(theta/2)]])
return mat
def ry(theta):
mat = np.array([[np.cos(theta/2), -1 * np.sin(theta/2)],
[np.sin(theta/2), np.cos(theta/2)]])
return mat
def rz(theta):
mat = np.array([[np.exp(-1j * theta/2), 0],
[0, np.exp(1j * theta/2)]])
return mat
def CZ():
mat = np.array([[1,0,0,0],[0,1,0,0],[0,0,1,0],[0,0,0,-1]])
return mat
# ============= The first figure =============
# We visualize the case where the second layer is kron(Ry, Ry)
ax = fig.add_subplot(1, 2, 1, projection='3d')
# Forward propagation to calculate loss function:
def cost_yy(para):
L1 = np.kron(ry(np.pi/4), ry(np.pi/4))
L2 = np.kron(ry(para[0]), ry(para[1]))
U = np.matmul(np.matmul(L1, L2), CZ())
H = np.zeros((2 ** N, 2 ** N))
H[0, 0] = 1
val = (U.conj().T @ H@ U).real[0][0]
return val
# Draw an image
Z = np.array([[cost_yy([x, y]) for x in X] for y in Y]).reshape(len(Y), len(X))
surf = ax.plot_surface(xx, yy, Z, cmap='plasma')
ax.set_xlabel(r"$\theta_1$")
ax.set_ylabel(r"$\theta_2$")
ax.set_title("Optimization Landscape for Ry-Ry Layer")
# ============= The second figure =============
# We visualize the case where the second layer is kron(Rx, Rz)
ax = fig.add_subplot(1, 2, 2, projection='3d')
def cost_xz(para):
L1 = np.kron(ry(np.pi/4), ry(np.pi/4))
L2 = np.kron(rx(para[0]), rz(para[1]))
U = np.matmul(np.matmul(L1, L2), CZ())
H = np.zeros((2 ** N, 2 ** N))
H[0, 0] = 1
val = (U.conj().T @ H @ U).real[0][0]
return val
Z = np.array([[cost_xz([x, y]) for x in X] for y in Y]).reshape(len(Y), len(X))
surf = ax.plot_surface(xx, yy, Z, cmap='viridis')
ax.set_xlabel(r"$\theta_1$")
ax.set_ylabel(r"$\theta_2$")
ax.set_title("Optimization Landscape for Rx-Rz Layer")
plt.show()
time_span = time.time() - time_start
print('The main program segment has run in total ', time_span, ' seconds')
The main program segment has run in total 1.5701446533203125 seconds
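As an extra illustration of the $R_z$-$R_z$ case mentioned above (cost_zz is a helper added here, not part of the original code): since $R_z$ gates only add a phase to $|00\rangle$, the loss does not depend on either parameter and the landscape is completely flat.
# Extra sketch: the flat Rz-Rz landscape. Rz only adds a phase to |00>,
# so the loss is independent of theta_1 and theta_2.
def cost_zz(para):
    L1 = np.kron(ry(np.pi / 4), ry(np.pi / 4))
    L2 = np.kron(rz(para[0]), rz(para[1]))
    U = np.matmul(np.matmul(L1, L2), CZ())
    H = np.zeros((2 ** N, 2 ** N))
    H[0, 0] = 1
    return (U.conj().T @ H @ U).real[0][0]

print(cost_zz([0.3, 1.2]), cost_zz([4.0, 5.5]))  # identical values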
Gradient Analysis Tool¶
Given the important role that gradients play in phenomena such as barren plateaus, we developed a simple gradient analysis tool in Paddle Quantum to help users inspect the gradient of each parameter in a circuit. This tool can be used to facilitate subsequent research on quantum neural networks.
Note that when using the gradient analysis tool, users only need to define the circuit and the loss function separately; there is no need to write their own training network.
Application I: Unsupervised Learning¶
For this case, we focus on variational quantum algorithms similar to the Variational Quantum Eigensolver (VQE). Suppose the objective function is the typical parameterized cost function used in VQAs: $O(\theta) = \left\langle0\dots 0\right\lvert U^{\dagger}(\theta)HU(\theta) \left\lvert0\dots 0\right\rangle$, where $U(\theta)$ is a parameterized quantum circuit, $H$ is a Hamiltonian, and $\theta = [\theta_1, \theta_2, \dots, \theta_n]$ is a list of trainable parameters in the circuit.
Here we use VQE to demonstrate the usage of this gradient analysis tool.
Paddle Quantum Implementation¶
Firstly, import the packages needed for the problem.
# Import related modules from Paddle Quantum and PaddlePaddle
from paddle_quantum.qinfo import pauli_str_to_matrix, random_pauli_str_generator
from paddle_quantum.hamiltonian import Hamiltonian
# GradTool package
from paddle_quantum.gradtool import random_sample, show_gradient, plot_loss_grad
Define Quantum Circuits¶
Next, construct the parameterized quantum circuit $U(\theta)$ in the objective function. Here we still use the random circuit defined above.
Define Objective Function¶
Note that the gradient analysis module calls the objective function in the form loss_func(circuit, *args) to calculate its value. This means that the second argument is a variable-length argument, so users can construct their own objective function as needed.
# objective function
def loss_func(circuit: Circuit, H: Hamiltonian) -> paddle.Tensor:
expec_val = ExpecVal(H)
return expec_val(circuit())
Then set some parameters required for the application.
# Hyper parameter settings
#np.random.seed(1) # Fixed Numpy random seed
N = 2 # Set the number of qubits
samples = 300 # Set the number of sampled random network structures
THETA_SIZE = N # Set the size of the parameter theta
ITR = 120 # Set the number of iterations
LR = 0.1 # Set the learning rate
SEED = 1 # Fixed the randomly initialized seed in the optimizer
Randomly generate quantum circuits and a list of Hamiltonian information.
# paddle.seed(SEED)
target = np.random.choice(3, N)
# Random generate parameters between 0 and 2*Pi
cir = rand_circuit(target, N)
print(cir)
# Random generate Hamiltonian information, in Pauli string format
H_l = Hamiltonian(random_pauli_str_generator(N, terms=7))
print('Hamiltonian info: \n', H_l)
--Ry(0.785)----Rz(5.325)----*--
                            |
--Ry(0.785)----Rx(3.479)----z--
Hamiltonian info:
 0.7469285407889965 X0, X1
-0.36732514676253114 Y0
0.14368811242599788 Z0
0.5751598291922848 Y0, Y1
0.12302397651276697 Y0, Z1
-0.07083710973626145 Y1
-0.054905066805228886 X0
cir and H_l are the parameters needed by the objective function loss_func.
Using the gradient analysis tool, we can obtain the gradient sampling results for each parameter in the circuit. There are three modes for users to choose from: single, max, and random. The single mode returns the mean and variance of each parameter's gradient after sampling the circuit multiple times, the max mode returns the mean and variance of the maximum gradient over all parameters in each round, and the random mode returns the mean and variance of one randomly chosen parameter's gradient in each round.
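As an aside (this call is an addition and is not executed in this tutorial), the random mode is invoked in exactly the same way:
# Hypothetical example of the 'random' mode: in each round, the gradient of one
# randomly chosen parameter is recorded.
# grad_mean_rand, grad_var_rand = random_sample(cir, loss_func, samples, H_l, mode='random')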
We sample the circuit 300 times. Here we choose the single mode to see the mean and variance of the gradient of each trainable parameter in the circuit; the default param=0 means that the gradient distribution of the first parameter is plotted.
grad_mean_list, grad_variance_list = random_sample(cir, loss_func, samples, H_l, mode='single', param=0)
Sampling: 100%|##################################################| 300/300 [00:02<00:00, 111.88it/s]
Mean of gradient for all parameters:
theta 1 : -0.00420132
theta 2 : -0.004461403
Variance of gradient for all parameters:
theta 1 : 0.08278141
theta 2 : 0.04159966
The user can also use the plot_loss_grad function to show how the loss value and the gradient vary during the training process.
plot_loss_grad(cir, loss_func, ITR, LR, H_l)
Training: 100%|##################################################| 120/120 [00:01<00:00, 110.56it/s]
As shown above, the loss value stops changing after a few dozen iterations, and the gradient is very close to 0. In order to clearly see the difference between the optimal solution and the theoretical value, we calculate the eigenvalues of the Hamiltonian H_l.
loss, grad = show_gradient(cir, loss_func, ITR, LR, H_l)
H_matrix = H_l.construct_h_matrix()
print("optimal result: ", loss[-1])
print("real energy:", np.linalg.eigh(H_matrix)[0][0])
Training: 100%|##################################################| 120/120 [00:01<00:00, 115.10it/s]
optimal result:  -0.5158533
real energy: -1.400689
The comparison shows that there is still a gap between the optimal solution obtained from the training of this circuit and the actual value.
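As a small follow-up sketch (ground_energy and energy_gap are names introduced here), this gap can be quantified explicitly:
# Quantify the gap between the trained energy and the exact ground-state energy
ground_energy = np.linalg.eigh(H_matrix)[0][0]
energy_gap = loss[-1] - ground_energy
print("energy gap:", energy_gap)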
More qubits¶
In the barren plateau effect, the gradient vanishes exponentially as the number of qubits increases. Next, we will see what happens to the sampled gradients when we increase the number of qubits (here we sample using the max mode).
# Hyper parameter settings
selected_qubit = [2, 4, 6, 8]
means, variances = [], []
# Keep increasing the number of qubits
for N in selected_qubit:
grad_info = []
THETA_SIZE = N
target = np.random.choice(3, N)
# Generate a value from 0 to 2PI
cir = rand_circuit(target, N)
H_l = Hamiltonian(random_pauli_str_generator(N, terms=10))
grad_mean_list, grad_variance_list = random_sample(cir, loss_func, samples, H_l, mode='max')
# Record sampling information
means.append(grad_mean_list)
variances.append(grad_variance_list)
Sampling: 100%|##################################################| 300/300 [00:02<00:00, 114.13it/s]
Mean of max gradient 0.48790267 Variance of max gradient 0.05380149
Sampling: 100%|###################################################| 300/300 [00:05<00:00, 59.67it/s]
Mean of max gradient 0.558792 Variance of max gradient 0.08236147
Sampling: 100%|###################################################| 300/300 [00:07<00:00, 41.93it/s]
Mean of max gradient 0.439257 Variance of max gradient 0.03570818
Sampling: 100%|###################################################| 300/300 [00:08<00:00, 37.20it/s]
Mean of max gradient 0.14468974 Variance of max gradient 0.003597733
To compare how the mean and variance of the maximum gradient change with the number of qubits, we plot them.
means = np.array(means)
variances = np.array(variances)
n = np.array(selected_qubit)
print("We then draw the statistical results of this sampled gradient:")
fig = plt.figure(figsize=plt.figaspect(0.3))
# ============= The first figure =============
# Calculate the relationship between the average gradient of random sampling and the number of qubits
plt.subplot(1, 2, 1)
plt.plot(n, means, "o-.")
plt.xlabel(r"Qubit #")
plt.ylabel(r"$ \partial \theta_{i} \langle 0|H |0\rangle$ Mean")
plt.title("Mean of {} sampled gradient".format(samples))
plt.xlim([1,9])
plt.grid()
# ============= The second figure =============
# Calculate the relationship between the variance of the randomly sampled gradient and the number of qubits
plt.subplot(1, 2, 2)
plt.plot(n, np.log(variances), "v-")  # plot the logarithm of the variance
plt.xlabel(r"Qubit #")
plt.ylabel(r"$ \partial \theta_{i} \langle 0|H |0\rangle$ Variance")
plt.title("Variance of {} sampled gradient".format(samples))
plt.xlim([1,9])
plt.grid()
plt.show()
We then draw the statistical results of this sampled gradient:
It can be seen that as the number of qubits increases, the maximum gradient over all parameters obtained from repeated sampling steadily approaches 0, and its variance also decreases.
To further see how the gradient changes as the number of qubits increases, we can visualize the influence of the number of qubits on the optimization landscape:
$\theta_1$ and $\theta_2$ are the first two circuit parameters, and the remaining parameters are all fixed to $\pi$. This helps us visualize the shape of this high-dimensional manifold. Unsurprisingly, the landscape becomes flatter as $n$ increases. Notice the rapidly decreasing scale of the $z$-axis: compared with the 2-qubit case, the optimization landscape for 6 qubits is very flat.
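For readers who want to reproduce such a slice, the following NumPy sketch (landscape_slice is a helper added here; for simplicity it uses $R_y$ rotations on every qubit instead of a random choice) scans $\theta_1$ and $\theta_2$ while fixing every other angle to $\pi$, reusing the ry gate defined above and the loss $|\langle 0\cdots0|U|0\cdots0\rangle|^2$:
# Sketch of the slicing idea: vary theta_1 and theta_2, fix all remaining
# rotation angles to pi, and evaluate the loss for H = |0...0><0...0|.
def landscape_slice(n, theta1, theta2, fixed=np.pi):
    # Initial layer of Ry(pi/4) on every qubit
    U = ry(np.pi / 4)
    for _ in range(n - 1):
        U = np.kron(U, ry(np.pi / 4))
    # One rotation layer (Ry on every qubit for simplicity)
    angles = [theta1, theta2] + [fixed] * (n - 2)
    L2 = ry(angles[0])
    for a in angles[1:]:
        L2 = np.kron(L2, ry(a))
    U = L2 @ U
    # Chain of CZ gates on adjacent qubits
    for i in range(n - 1):
        cz = np.eye(2 ** n, dtype=complex)
        for b in range(2 ** n):
            # CZ flips the sign when qubits i and i+1 are both |1>
            if (b >> (n - 1 - i)) & 1 and (b >> (n - 2 - i)) & 1:
                cz[b, b] = -1
        U = cz @ U
    # For H = |0...0><0...0| the loss reduces to |U[0, 0]|^2
    return abs(U[0, 0]) ** 2
# e.g. Z = np.array([[landscape_slice(6, x, y) for x in X] for y in Y]) gives a 6-qubit slice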
Note that this effect appears only when the network structure and the loss function meet certain conditions, e.g., when the random circuit forms a unitary 2-design (see [1]).
Application II: Quantum encoded classical data¶
Supervised learning is one of the important applications of quantum neural networks. However, the barren plateau phenomenon limits the performance of quantum variational algorithms in such problems. Therefore, how to design more efficient circuits and loss functions to avoid the barren plateau phenomenon is one of the important research directions of quantum neural networks at present.
In fact, it has been shown that using the Rényi divergence as a loss function when training generative models can effectively avoid the barren plateau phenomenon [3]. The gradient analysis tool allows us to quickly analyze gradient-related information in a supervised learning model, which can help researchers explore different quantum circuits and loss functions.
Here, we present an example using the dataset provided by Encoding Classical Data into Quantum States.
Paddle Quantum Implementation¶
Firstly, import the packages needed for the problem.
from paddle_quantum.dataset import Iris
from paddle_quantum.gradtool import random_sample_supervised, plot_supervised_loss_grad
Define Quantum Circuits¶
Next, construct the parameterized quantum circuit $U(\theta)$.
def U_theta(n: int, depth: int):
# Initialize the quantum circuit
cir = Circuit(n)
# rotation gates
cir.rz()
cir.ry()
cir.rz()
# default depth = 1
# Build adjacent CNOT gates and RY rotation gates
for _ in range(3, depth + 3):
cir.cnot()
cir.ry()
return cir
Define Objective Function¶
Here the objective function loss_func is defined; its second parameter is again the variable-length argument *args.
def loss_func(cir: Circuit, *args):
# input the quantum states and training labels
state_in = args[0]
label = args[1]
# Convert Numpy array to tensor
label_pp = paddle.to_tensor(label).reshape([-1, 1])
Utheta = cir.unitary_matrix()
# Since Utheta is learned, we use row vector operations here to speed up the training without affecting the results
state_out = state_in @ Utheta
# Measure the expected value of the Pauli Z operator <Z>
Ob = paddle.to_tensor(pauli_str_to_matrix([[1.0, 'z0']], qubit_num))
E_Z = state_out @ Ob @ paddle.transpose(paddle.conj(state_out), perm=[0, 2, 1])
# Mapping <Z> into label
state_predict = paddle.real(E_Z)[:, 0] * 0.5 + 0.5
loss = paddle.mean((state_predict - label_pp) ** 2) # mean-squared error
return loss
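As an optional addition (the accuracy helper below mirrors the operations in loss_func and is not part of the original tutorial), the same $\langle Z\rangle$ readout can be turned into hard 0/1 predictions to monitor classification accuracy, e.g. by calling accuracy(circuit, train_x, train_y) after training:
# Optional helper mirroring loss_func: map <Z> to a hard 0/1 prediction
# and compare with the labels to obtain a classification accuracy
def accuracy(cir: Circuit, state_in, label) -> float:
    Utheta = cir.unitary_matrix()
    state_out = state_in @ Utheta
    Ob = paddle.to_tensor(pauli_str_to_matrix([[1.0, 'z0']], qubit_num))
    E_Z = state_out @ Ob @ paddle.transpose(paddle.conj(state_out), perm=[0, 2, 1])
    predict = (paddle.real(E_Z)[:, 0] * 0.5 + 0.5).numpy().flatten()
    return float(np.mean((predict > 0.5).astype(int) == np.array(label).flatten()))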
Define the dataset¶
Here, we use the Iris dataset for the experiment.
time_start = time.time()
# Hyper parameter settings
test_rate = 0.2
qubit_num = 2 # Don't give too many qubits, otherwise it will be seriously overfitted
depth = 1
lr = 0.1
BATCH = 4
EPOCH = 4
SAMPLE = 300
# dataset
iris = Iris(encoding='amplitude_encoding', num_qubits=qubit_num, test_rate=test_rate, classes=[0,1], return_state=True)
# Get inputs and labels for the dataset
train_x, train_y = iris.train_x, iris.train_y # train_x, test_x here is paddle.tensor type, train_y,test_y here is ndarray type.
test_x, test_y = iris.test_x, iris.test_y
testing_data_num = len(test_y)
training_data_num = len(train_y)
# Creating trainable parameters for circuits
# Creating Circuits
circuit = U_theta(qubit_num, depth)
print(circuit)
--Rz(5.714)----Ry(4.260)----Rz(5.514)----*----x----Ry(4.171)--
                                         |    |
--Rz(0.917)----Ry(0.867)----Rz(4.504)----x----*----Ry(3.387)--
Let's look at the variation of the loss function values and gradients during training with EPOCH=4 and BATCH=4.
loss,grad = plot_supervised_loss_grad(circuit, loss_func, N=qubit_num, EPOCH=EPOCH, LR=lr,BATCH=BATCH, TRAIN_X=train_x, TRAIN_Y=train_y)
We can see that after about ten iterations, the loss value only fluctuates within a small range, indicating that the training process is stable.
Then we randomly sample the initial parameters of the model 300 times, and here we choose the max mode to see the mean and variance of the maximum gradient over all parameters.
mean, variance = random_sample_supervised(circuit,loss_func, N=qubit_num, sample_num=SAMPLE, BATCH=BATCH, TRAIN_X=train_x, TRAIN_Y=train_y, mode='max')
Sampling: 100%|##################################################| 300/300 [00:02<00:00, 122.85it/s]
Mean of max gradient 0.15121777 Variance of max gradient 0.0036665837
Summary¶
The trainability problem is a core direction of current research on quantum neural networks. The gradient analysis tool provided by Paddle Quantum supports users in diagnosing the trainability of their models, facilitating the study of subsequent problems such as barren plateaus.
References¶
[1] McClean, J. R., Boixo, S., Smelyanskiy, V. N., Babbush, R. & Neven, H. Barren plateaus in quantum neural network training landscapes. Nat. Commun. 9, 4812 (2018).
[2] Cerezo, M., Sone, A., Volkoff, T., Cincio, L. & Coles, P. J. Cost-Function-Dependent Barren Plateaus in Shallow Quantum Neural Networks. arXiv:2001.00550 (2020).
[3] Kieferová, M., Ortiz Marrero, C. & Wiebe, N. Quantum Generative Training Using Rényi Divergences. arXiv:2106.09567 (2021).