
[RFC] [Language] Quantum allocation with state initialization #1086

Closed
15 of 17 tasks
amccaskey opened this issue Jan 11, 2024 · 16 comments
Labels
language Anything related to the CUDA Quantum language specification RFC-approved
Milestone

Comments

@amccaskey
Collaborator

amccaskey commented Jan 11, 2024

TODO:

Example with #1467

__qpu__ void kernel(cudaq::state& initState) {
  cudaq::qvector q = initState;
}

def kernel(initState: cudaq.state):
    q = cudaq.qvector(initState)

I propose we update the language to support quantum allocation with user-provided initial state specification. This should supersede functions like from_state(...) on the kernel_builder.

C++:

New constructors

  qubit::qubit(const vector<complex<double>>&);
  qubit::qubit(const initializer_list<complex<double>>&);
  qvector::qvector(const vector<complex<double>>&);
  qvector::qvector(const initializer_list<complex<double>>&);

New builder method

  QuakeValue qalloc(vector<complex<double>> &)

Python

The Python builder API would be similar, as in the following.

  v = [0., 1., 1., 0.]
  qubits = kernel.qalloc(v)

@cudaq.kernel 
def test(vec : list[complex]):
   q = cudaq.qvector(vec)
   ...

C++ Usage

The following snippet demonstrates what this might look like:

__qpu__ auto test0() {
  // Init from state vector
  cudaq::qubit q = {0., 1.};
  return mz(q);
}

__qpu__ auto test1() {
  // Init from predefined state vectors
  cudaq::qubit q = cudaq::ket::one;
  return mz(q);
}

__qpu__ void test2() { 
  // Init from state vector
  cudaq::qubit q = {M_SQRT1_2, M_SQRT1_2}; 
}

__qpu__ void test3() { 
  // Init from state vector 
  cudaq::qvector q = {M_SQRT1_2, 0., 0., M_SQRT1_2}; 
}

__qpu__ void test4(const std::vector<cudaq::complex> &state) {
  // State vector from host 
  cudaq::qvector q = state;
}

void useBuilder() {
  std::vector<cudaq::complex> state{M_SQRT1_2, 0., 0., M_SQRT1_2}; 

  {
    // (deferred) qubit allocation from concrete state vector
    auto kernel = cudaq::make_kernel();
    auto qubitsInitialized = kernel.qalloc(state);
  }
  {
    // kernel parameterized on input state data
    auto [kernel, inState] = cudaq::make_kernel<std::vector<cudaq::complex>>();
    auto qubitsInitialized = kernel.qalloc(inState); 
   
    cudaq::sample(kernel, state).dump();
  }
}

Python usage

Vectors of complex or floating-point numbers

Notes

  • Implicit conversion from a list of float to a list of complex is allowed when passing arguments.
  • Initializer elements are automatically converted if the precision of the numbers in the qvector initializer does not match the current simulation precision.
    • A warning is emitted on conversion due to performance concerns, recommending cudaq.amplitudes or cudaq.complex.
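The cost behind that warning can be illustrated with plain NumPy (this is an illustration only, not the CUDA-Q API; the `target` dtype stands in for the simulator's precision):

```python
import numpy as np

# Converting a float64 amplitude list to the simulation precision allocates a
# new buffer and copies every element -- an O(2**n) cost for an n-qubit state,
# which is the performance concern behind the warning.
amps = [0.70710678, 0.0, 0.0, 0.70710678]
target = np.complex64            # stand-in for the current simulation precision
arr = np.asarray(amps)           # dtype float64
if arr.dtype != target:
    arr = arr.astype(target)     # conversion copies the whole vector
print(arr.dtype)
```

Constructing the data with the matching dtype up front (e.g., via cudaq.amplitudes or cudaq.complex) avoids this copy.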

Lists

# Passing complex vectors as params
c = [.70710678 + 0j, 0., 0., 0.70710678]
@cudaq.kernel
def kernel(vec: list[complex]):
    q = cudaq.qvector(vec)

# Capturing complex vectors
c = [.70710678 + 0j, 0., 0., 0.70710678]
@cudaq.kernel
def kernel():
    q = cudaq.qvector(c)

# Capturing complex vectors and converting to 
# numpy array inside the kernel
c = [.70710678 + 0j, 0., 0., 0.70710678]
@cudaq.kernel
def kernel():
    q = cudaq.qvector(np.array(c))

# Creating complex arrays inside kernels
@cudaq.kernel
def kernel():
    q = cudaq.qvector([1.0 + 0j, 0., 0., 1.])

Numpy arrays

# From np array created inside a kernel with a complex dtype
c = [.70710678 + 0j, 0., 0., 0.70710678]
@cudaq.kernel
def kernel(vec: list[complex]):
    q = cudaq.qvector(np.array(vec, dtype=complex))

c = [.70710678 + 0j, 0., 0., 0.70710678]
@cudaq.kernel
def kernel(vec: list[complex]):
    q = cudaq.qvector(np.array(vec, dtype=np.complex64))

# Using precision-agnostic API
c = [.70710678 + 0j, 0., 0., 0.70710678]
@cudaq.kernel
def kernel(vec: list[complex]):
    q = cudaq.qvector(np.array(vec, dtype=cudaq.complex()))

c = cudaq.amplitudes([.70710678, 0., 0., 0.70710678])
@cudaq.kernel
def kernel(vec: list[complex]):
    q = cudaq.qvector(vec)


# Passing np arrays as params
c = np.array(c, dtype=cudaq.complex())
@cudaq.kernel
def kernel(vec: np.array):
    q = cudaq.qvector(vec)

c = np.array(c, dtype=cudaq.complex())
@cudaq.kernel
def kernel(vec: np.ndarray):
    q = cudaq.qvector(vec)

c = np.array(c, dtype=cudaq.complex())
@cudaq.kernel
def kernel(vec: np.ndarray[any, complex]):
    q = cudaq.qvector(vec)

cudaq.State

# Pass state as a parameter (for fp64 simulators)
c = np.array([1. / np.sqrt(2.) + 0j, 0., 0., 1. / np.sqrt(2.)], dtype=complex)
state = cudaq.State.from_data(c)

@cudaq.kernel
def kernel(vec: cudaq.State):
    q = cudaq.qvector(vec)

counts = cudaq.sample(kernel, state)

# Pass state as a parameter (for fp32 simulators)
c = np.array([1. / np.sqrt(2.) + 0j, 0., 0., 1. / np.sqrt(2.)], dtype=np.complex64)
state = cudaq.State.from_data(c)

@cudaq.kernel
def kernel(vec: cudaq.State):
    q = cudaq.qvector(vec)

counts = cudaq.sample(kernel, state)

# Pass state as a parameter (precision-agnostic)
c = np.array([1. / np.sqrt(2.) + 0j, 0., 0., 1. / np.sqrt(2.)], dtype=cudaq.complex())
state = cudaq.State.from_data(c)

@cudaq.kernel
def kernel(vec: cudaq.State):
    q = cudaq.qvector(vec)

counts = cudaq.sample(kernel, state)


# Capture state (for fp64 simulators)
c = np.array([1. / np.sqrt(2.) + 0j, 0., 0., 1. / np.sqrt(2.)], dtype=complex)
state = cudaq.State.from_data(c)

@cudaq.kernel
def kernel():
    q = cudaq.qvector(state)

counts = cudaq.sample(kernel)

# Capture state (for fp32 simulators)
c = np.array([1. / np.sqrt(2.) + 0j, 0., 0., 1. / np.sqrt(2.)], dtype=np.complex64)
state = cudaq.State.from_data(c)

@cudaq.kernel
def kernel():
    q = cudaq.qvector(state)

counts = cudaq.sample(kernel)

# Pass state from one kernel to another
@cudaq.kernel
def bell():
    qubits = cudaq.qvector(2)
    h(qubits[0])
    cx(qubits[0], qubits[1])

state = cudaq.get_state(bell)

@cudaq.kernel
def kernel(initialState: cudaq.State):
    qubits = cudaq.qvector(initialState)

state2 = cudaq.get_state(kernel, state)

For library-mode / simulation we pass the state data along to NVQIR. For physical backends, we can replace runtime state data with the result of a circuit synthesis pass (like the current implementation in from_state(...)).

@boschmitt
Collaborator

Thanks @amccaskey for proposing this.

I have a clarification question regarding the semantics of a cudaq::qvector's state. For example, what will be the return value of the following kernel?

__qpu__ bool foo() { 
  // Init from state vector 
  cudaq::qvector q = {0., 1., 0., 0.};
  return cudaq::mz(q[0]);
}

I see two possibilities:

  • It returns true.
    • Rationale: Index 1 in the initializer list corresponds to state |1> (or, in binary, |0b01>---the state is interpreted as a number). If q[0] corresponds to the least significant (qu)bit and the state is interpreted as a number, then the state of q[0] is |0b1> and thus mz(q[0]) returns true.
  • It returns false:
    • Rationale: Index 1 in the initializer list corresponds to state |0>|1> (or |0,1>---here I could have used the short syntax |01> but I want to make the point that this state should not be interpreted as a number, but as bitstring---or vector of bits). Hence q[0] is |0> and mz(q[0]) returns false.

Thinking a bit forward, it seems to me that the second option is more appropriate. Eventually, we can define a quantum integer type, say cudaq::qint, in which the state must be interpreted as a number:

__qpu__ bool foo() { 
  // Init from state vector 
  cudaq::qint q = {0., 1., 0., 0.};
  return cudaq::mz(q[0]);
}

In this case, the kernel must return true.
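The two readings can be made concrete with a small sketch (plain Python, not CUDA-Q; `prob_qubit_one` and the `q0_is_msb` flag are hypothetical names introduced here for illustration):

```python
import numpy as np

def prob_qubit_one(state, qubit, q0_is_msb):
    """Probability of measuring `qubit` as 1, for an amplitude vector over the computational basis."""
    n = int(np.log2(len(state)))
    p = 0.0
    for idx, amp in enumerate(state):
        bits = format(idx, f"0{n}b")  # MSB-first binary expansion of the index
        bit = bits[qubit] if q0_is_msb else bits[n - 1 - qubit]
        p += abs(amp) ** 2 if bit == "1" else 0.0
    return p

state = [0.0, 1.0, 0.0, 0.0]  # all amplitude on index 1
# Option 1: index read as a number, q[0] = least significant bit -> mz(q[0]) is true
print(prob_qubit_one(state, 0, q0_is_msb=False))  # 1.0
# Option 2: index read as the bitstring |q0, q1> -> q[0] is |0>, mz(q[0]) is false
print(prob_qubit_one(state, 0, q0_is_msb=True))   # 0.0
```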

@1tnguyen
Collaborator

To make the API future-proof, we could also consider adding an optional bit-ordering vector argument (similar to the cuStateVec API).

cudaq::qvector q({0., 1., 0., 0.}, {0, 1}); // q[0] should be |1>
cudaq::qvector q({0., 1., 0., 0.}, {1, 0}); // q[1] should be |1>

When no ordering is provided, the default could be one of the two endian conventions, e.g., LSB first.
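A bit-ordering argument amounts to a permutation of the amplitude indices. A plain-Python sketch (the `reorder` helper is a hypothetical name, not a CUDA-Q API):

```python
def reorder(state, order):
    """Permute amplitudes so that qubit i of the output is qubit order[i] of the input.

    Indices are read LSB-first: bit k of an amplitude index is the state of qubit k.
    """
    n = len(order)
    out = [0.0] * len(state)
    for idx, amp in enumerate(state):
        bits = [(idx >> k) & 1 for k in range(n)]         # input qubit values
        new_idx = sum(bits[order[i]] << i for i in range(n))
        out[new_idx] = amp
    return out

print(reorder([0., 1., 0., 0.], [0, 1]))  # identity ordering: q[0] stays |1>
print(reorder([0., 1., 0., 0.], [1, 0]))  # swapped ordering: q[1] is now |1>
```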

@amccaskey
Collaborator Author

(Quoting @boschmitt's comment above in full.)

@boschmitt I prefer we go with bullet 2.

@amccaskey
Collaborator Author

@boschmitt for your qint example, I was hoping to support cudaq::qint q = 4; instead of the initializer list. Do you foresee any gotchas there?

@amccaskey
Collaborator Author

One thing to add, it will likely be good to update the cudaq::state definition to be backend specific, and allow it as input to a CUDA Quantum kernel. If it is backend specific, we can have the sub-type hold a GPU device pointer and avoid copying the large data vector from device to host.

__qpu__ void test4(const cudaq::state &state) {
  // Input state could wrap GPU device pointer 
  cudaq::qvector q = state;
  ... build off initial state ... 
}

void useTest4() {
  auto initStateGen = [](...) __qpu__ { ... }; 
  auto initState = cudaq::get_state(initStateGen, ...); 
  cudaq::sample(test4, initState).dump();
}

@justinlietz
Collaborator

I was hoping to support cudaq::qint q = 4; instead of the initializer list. Do you foresee any gotchas there?

Would this be interpreted as the bitstring 1,0,0? You would need to know how many leading zeros are needed, so maybe an additional constructor parameter that is nQubits.

If the goal is to construct states restricted to the computational basis, I would think rather than qint we could add qvector(const std::vector<bool>&);. Here the vector is of length nQubits, rather than 2**nQubits, and the construction is just specified by the bitstring.
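The suggested bitstring constructor maps a length-nQubits vector of bits to a length-2**nQubits amplitude vector. A sketch under interpretation 2 (index read as the bitstring, q[0] leftmost; `basis_state` is a hypothetical helper, not a proposed API name):

```python
def basis_state(bits):
    """Amplitude vector for the computational basis state given by `bits` (q[0] first)."""
    n = len(bits)
    idx = 0
    for b in bits:                 # q[0] occupies the most significant position
        idx = (idx << 1) | int(b)
    state = [0.0] * (1 << n)
    state[idx] = 1.0
    return state

print(basis_state([1, 0, 0]))  # |1,0,0>: amplitude 1 at index 0b100 = 4
```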

@boschmitt
Collaborator

@boschmitt for your qint example, I was hoping to support cudaq::qint q = 4; instead of the initializer list. Do you foresee any gotchas there?

We can certainly support it, but we would still have to define what it means with respect to a state vector. There are more questions to answer in order to support this idea. For example:

  • How many qubits does cudaq::qint q = 4 create? A fixed number, say 8, or the minimum necessary to represent 4?
  • Would we allow users to easily access the qubits, e.g., using q[0]? If we do, what would q[0] return?
  • Would the user be able to create a cudaq::qint whose state is a superposition of different integers? If we allow that, how do the indices of the initializer list relate to the integers represented by the state?

Let me try to rephrase my questions: if we have a set of qubits that we can initialize using a state vector, then we need clarity on:

  • How does the index of the state vector relate to the state? E.g., given a 3-qubit state vector, does index 1 correspond to the state represented by the bitstring |001>?
  • Depending on the type, e.g., cudaq::qvector or cudaq::qint, does the interpretation of |001> change? For example, if the type is cudaq::qvector we interpret the state as |0, 0, 1> and the state of q[0] is |0>; if the type is cudaq::qint we interpret the state as |0b001> and q[0] is |1>.

@amccaskey
Collaborator Author

(Quoting the qint exchange above in full.)

I guess qint may be a bit beyond this RFC, but to answer your first question: for qint we might want a template parameter for the size of the qubit register, qint<N>, and then typedefs for common sizes.

@boschmitt
Collaborator

I guess qint may be a bit beyond this RFC

I agree.

The main point on which I asked for clarification is how the semantics of the state vector relate to the type, cudaq::qvector, and to accessing individual qubits. I provided two takes on it, and it seems there is a preference for the second. The cudaq::qint digression is just a thought experiment to see how our decision will stand the test of time and possible CUDA Quantum evolutions.

@schweitzpgi
Collaborator

schweitzpgi commented Apr 2, 2024

qubit initializer list

See PR #1461

@amccaskey
Collaborator Author

@schweitzpgi I think we can probably start thinking about MLIR support and QIR lowering for a quake.state type to support

__qpu__ void kernel(cudaq::state inState) { 
  cudaq::qvector q = inState;
  ...
}

in anticipation of #1467. I think we can just treat this like Clang would and lower to a ptr and update the InitializeStateOp lowering to invoke a new NVQIR function.

@1tnguyen
Collaborator

Some notes about the ownership semantics for cudaq::state after implementation experimentation in #1542 for discussion:

  • Currently, CircuitSimulator and SimulationState implementations often assume ownership of the underlying memory resources (exchanged at getSimulationState).

  • The user-facing cudaq::state class (the result of get_state) would ideally hold the SimulationState with shared ownership (to make passing the state around more convenient, for Python bindings, etc.)

  • Passing this cudaq::state back to a quantum kernel for qvector allocations can be implemented in a couple of ways:

(1) Adopting reference semantics
e.g.,

__qpu__ void kernel(cudaq::state inState) { 
  cudaq::qvector q{inState};
  ...
}
// The above would be equivalent to this.
__qpu__ void kernel1(cudaq::state& inState) { 
  cudaq::qvector q{inState};
  ...
}

auto myState = cudaq::get_state(some_kernel);
kernel(myState); // or  kernel1(myState);
// ==> myState is updated as a result of kernel execution
  • Simulators need to cope with both ownership scenarios for the underlying data (e.g., qpp::ket, device memory, etc.). For example, a subsequent getSimulationState may need to perform a copy if the current state is not owned by the simulator.

  • A referenced state that was involved in a sub-state allocation needs consideration:

__qpu__ void kernel(cudaq::state inState) { 
  cudaq::qvector my_vec(N); // default init 
  ...
  // Adding some qubits in a state
  cudaq::qvector q{inState};
  ...
}


auto myState = cudaq::get_state(some_kernel);
kernel(myState); 
// should myState be updated to reflect the whole simulator's state (+N qubits)
// or stay the same (i.e., the user needs to call a `get_state` explicitly to get the new state)?

(2) Adopting move semantics

  • The user needs to explicitly move the state to pass it to the simulator (giving it back to the simulator).
__qpu__ void kernel(cudaq::state&& inState) { 
  cudaq::qvector q{std::move(inState)};
  ...
}


auto myState = cudaq::get_state(some_kernel);
kernel(std::move(myState)); 
// User has passed the ownership of the state to the kernel.
  • We could (theoretically) also distinguish/support different qvector allocation signatures:

 qvector(cudaq::state &&initState);      // move
 qvector(const cudaq::state &initState); // copy state (inside the simulator)
 qvector(cudaq::state initState);        // copy state (by the state)
  • The user needs to call get_state afterward to get the new state (the state is moved out of the simulator back to the user).

  • The obvious downside is the boilerplate associated with std::move needed to make sure the state is passed around most efficiently.

@schweitzpgi
Collaborator

schweitzpgi commented Apr 23, 2024

Building on Thien's comment above on move semantics, the qvector class is itself not claiming any ownership over the state object. The qvector ctor does pass the state object to the execution manager.

For performance reasons, let the user decide what happens to the state object used in the qvector ctor.

Move semantics

This seems straightforward. The cudaq::state object is moved into the execution manager, not copied.

cudaq::state state = ...;
qvector q(std::move(state));
// the variable `state` is dead/invalid at this point

In this case, this code can be optimized a bit, since state is dead and no reference counting or destruction needs to take place.

Reference copy semantics

The cudaq::state class can be a "reference wrapper". In that case a "copy" is shallow and only copies the pointer. The data itself is fully shared and gets reclaimed when the last reference goes out of scope. This adds some overhead and possibly leaks state information in a less intuitive way. See the following example.

cudaq::state state = ...;
qvector q1(state);  // calls qvector(cudaq::state);
// the variable `state` still has a reference to the state information
...
// the `state` information, while it can clearly still be referenced, may have _changed_ in the code above
qvector q2(state); // Surprise? q2 does not have the same initial state as q1!
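The aliasing surprise has a direct analogue in plain Python (an illustration only, not CUDA-Q code; the variable names are hypothetical):

```python
import copy

# A shallow "copy" of a reference-wrapped state aliases the same buffer.
state = [1.0, 0.0]               # stand-in for the wrapped state data
q1_init = state                  # qvector q1(state): shallow, shares the buffer
state[0], state[1] = 0.0, 1.0    # "kernel execution" mutates the shared data
q2_init = state                  # qvector q2(state): sees the mutated state
print(q1_init == [0.0, 1.0])     # True -- q1's "initial state" changed underneath it
snapshot = copy.deepcopy(state)  # a deep copy at construction would avoid the surprise
```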

@1tnguyen
Collaborator

In the updated code, we'd add the full set of qvector constructor signatures from a state, e.g.,

qvector(const cudaq::state &initState); 
qvector(cudaq::state &initState); 
qvector(cudaq::state &&initState);
qvector(cudaq::state initState); 

In particular, the const & signature would propagate to the simulator and ask it to create its copy of the state.

In the above example, adding const would make the referenced state constant (if that was the intent).

const cudaq::state state = ...;
qvector q1(state);  // calls qvector(const cudaq::state&);
// the simulator will make a copy of the state to do simulation
...
// the `state` information would still be the same
qvector q2(state); 

@annagrin
Collaborator

annagrin commented May 15, 2024

Would we like to support the following python cases?

# Passing np arrays as params
c = np.array(c, dtype=cudaq.complex())
@cudaq.kernel
def kernel(vec: np.array):
    q = cudaq.qvector(vec)

c = np.array(c, dtype=cudaq.complex())
@cudaq.kernel
def kernel(vec: np.ndarray):
    q = cudaq.qvector(vec)

c = np.array(c, dtype=cudaq.complex())
@cudaq.kernel
def kernel(vec: np.ndarray[any, complex]):
    q = cudaq.qvector(vec)

@bettinaheim
Collaborator

Closing this - any remaining work is tracked separately.
