PennyLaneAI · xiaohanzai · Nov 6, 2024 · Nov 7, 2024 · Nov 7, 2024 · Nov 7, 2024
diff --git a/.github/CHANGELOG.md b/.github/CHANGELOG.md
@@ -2,6 +2,9 @@
 
 ### New features since last release
 
+* Add OpenMP support to the `collapse` method and the normalization loop in the `lightning.qubit` backend.
+  [(#986)](https://github.com/PennyLaneAI/pennylane-lightning/pull/986)
+
 * Add native N-controlled gates support to `lightning.gpu`'s single-GPU backend.
   [(#938)](https://github.com/PennyLaneAI/pennylane-lightning/pull/938)
 

diff --git a/pennylane_lightning/core/_version.py b/pennylane_lightning/core/_version.py
@@ -16,4 +16,4 @@
    Version number (major.minor.patch[-label])
 """
 
-__version__ = "0.40.0-dev4"
+__version__ = "0.40.0-dev5"
diff --git a/pennylane_lightning/core/src/simulators/lightning_qubit/StateVectorLQubit.hpp b/pennylane_lightning/core/src/simulators/lightning_qubit/StateVectorLQubit.hpp
@@ -695,9 +695,12 @@ class StateVectorLQubit : public StateVectorBase<PrecisionT, Derived> {
         // **__**__ for stride 2
         // ****____ for stride 4
         const std::size_t k = branch ? 0 : 1;
+#if defined(_OPENMP)
+#pragma omp parallel for collapse(2) default(none) shared(arr, half_section_size, stride, k)
+#endif
         for (std::size_t idx = 0; idx < half_section_size; idx++) {
-            const std::size_t offset = stride * (k + 2 * idx);
             for (std::size_t ids = 0; ids < stride; ids++) {
+                const std::size_t offset = stride * (k + 2 * idx);
                 arr[offset + ids] = {0., 0.};
             }
         }
@@ -716,6 +719,9 @@ class StateVectorLQubit : public StateVectorBase<PrecisionT, Derived> {
                     "vector has norm close to zero and can't be normalized");
 
         ComplexT inv_norm = 1. / norm;
+#if defined(_OPENMP)
+#pragma omp parallel for default(none) shared(arr, inv_norm)
+#endif
         for (std::size_t k = 0; k < BaseType::getLength(); k++) {
             arr[k] *= inv_norm;
         }