diff --git a/CMakeLists.txt b/CMakeLists.txt
index 6564e15d..4509e872 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -22,6 +22,9 @@ if(BUILD_METAL)
     add_compile_options(-DMODMESH_METAL)
 endif()
 
+option(BUILD_CUDA "build with CUDA" OFF)
+message(STATUS "BUILD_CUDA: ${BUILD_CUDA}")
+
 option(USE_CLANG_TIDY "use clang-tidy" OFF)
 option(LINT_AS_ERRORS "clang-tidy warnings as errors" OFF)
 
diff --git a/Makefile b/Makefile
index 35df8a73..d674513f 100644
--- a/Makefile
+++ b/Makefile
@@ -24,6 +24,7 @@ DEBUG_SYMBOL ?= ON
 MODMESH_PROFILE ?= OFF
 BUILD_METAL ?= OFF
 BUILD_QT ?= ON
+BUILD_CUDA ?= OFF
 USE_CLANG_TIDY ?= OFF
 CMAKE_BUILD_TYPE ?= Release
 MAKE_PARALLEL ?= -j
@@ -89,6 +90,7 @@ CMAKE_CMD = cmake $(MODMESH_ROOT) \
 	-DDEBUG_SYMBOL=$(DEBUG_SYMBOL) \
 	-DBUILD_METAL=$(BUILD_METAL) \
 	-DBUILD_QT=$(BUILD_QT) \
+	-DBUILD_CUDA=$(BUILD_CUDA) \
 	-DUSE_CLANG_TIDY=$(USE_CLANG_TIDY) \
 	-DLINT_AS_ERRORS=ON \
 	-DMODMESH_PROFILE=$(MODMESH_PROFILE) \
diff --git a/cpp/modmesh/CMakeLists.txt b/cpp/modmesh/CMakeLists.txt
index a1d494bb..ce4e5525 100644
--- a/cpp/modmesh/CMakeLists.txt
+++ b/cpp/modmesh/CMakeLists.txt
@@ -30,6 +30,17 @@ if (BUILD_QT)
     find_package(Qt6 REQUIRED COMPONENTS 3DExtras)
 endif () # BUILD_QT
 
+if (BUILD_CUDA)
+    find_package(CUDA REQUIRED)
+    find_package(CUDAToolkit REQUIRED)
+    enable_language(CUDA)
+    if (TARGET CUDA::cufft)
+        message(STATUS "CUDA cuFFT available")
+    else ()
+        message(FATAL_ERROR "CUDA cuFFT not found")
+    endif ()
+endif () # BUILD_CUDA
+
 add_subdirectory(buffer)
 add_subdirectory(mesh)
 add_subdirectory(toggle)
@@ -135,6 +146,12 @@ else () # BUILD_QT
     )
 endif () # BUILD_QT
 
+if (BUILD_CUDA)
+    set_target_properties(modmesh_primary PROPERTIES LINKER_LANGUAGE CUDA)
+    target_compile_definitions(modmesh_primary PRIVATE BUILD_CUDA)
+    target_link_libraries(modmesh_primary PRIVATE CUDA::cudart CUDA::cufft)
+endif () # BUILD_CUDA
+
 set_target_properties(modmesh_primary PROPERTIES POSITION_INDEPENDENT_CODE ON)
 
 if (CLANG_TIDY_EXE AND USE_CLANG_TIDY)
diff --git a/cpp/modmesh/device/cuda/cuda_error_handle.hpp b/cpp/modmesh/device/cuda/cuda_error_handle.hpp
new file mode 100644
index 00000000..80ca6861
--- /dev/null
+++ b/cpp/modmesh/device/cuda/cuda_error_handle.hpp
@@ -0,0 +1,89 @@
+#pragma once
+
+/*
+ * Copyright (c) 2025, Alex Chiang <jyxemperor@gmail.com>
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions are met:
+ *
+ * - Redistributions of source code must retain the above copyright notice,
+ *   this list of conditions and the following disclaimer.
+ * - Redistributions in binary form must reproduce the above copyright notice,
+ *   this list of conditions and the following disclaimer in the documentation
+ *   and/or other materials provided with the distribution.
+ * - Neither the name of the copyright holder nor the names of its contributors
+ *   may be used to endorse or promote products derived from this software
+ *   without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+ * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
+ * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
+ * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
+ * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
+ * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
+ * POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include <cuda.h>
+#include <cuda_runtime.h>
+#include <cufft.h>
+#include <stdio.h>
+
+#define CUDA_SAFE_CALL(err) __cudaSafeCall(err, __FILE__, __LINE__)
+#define CUFFT_SAFE_CALL(err) __cufftSafeCall(err, __FILE__, __LINE__)
+#define CUDA_GET_LAST_ERROR() __cudaCheckError(__FILE__, __LINE__)
+
+void inline __cudaSafeCall(cudaError_t err, const char * file, const int line)
+{
+    if (err != cudaSuccess)
+    {
+        printf("CUDA Error %d: %s.\n%s(%d)\n", (int)err, cudaGetErrorString(err), file, line);
+    }
+}
+
+void inline __cudaCheckError(const char * file, const int line)
+{
+    cudaError_t err = cudaDeviceSynchronize();
+    if (err != cudaSuccess)
+    {
+        printf("CUDA Error %d: %s.\n%s(%d)\n", (int)err, cudaGetErrorString(err), file, line);
+    }
+
+    err = cudaGetLastError();
+    if (err != cudaSuccess)
+    {
+        printf("CUDA Error %d: %s.\n%s(%d)\n", (int)err, cudaGetErrorString(err), file, line);
+    }
+}
+
+const inline char * __cufftResultToString(cufftResult err)
+{
+    switch (err)
+    {
+    case CUFFT_SUCCESS: return "CUFFT_SUCCESS.";
+    case CUFFT_INVALID_PLAN: return "CUFFT_INVALID_PLAN.";
+    case CUFFT_ALLOC_FAILED: return "CUFFT_ALLOC_FAILED.";
+    case CUFFT_INVALID_TYPE: return "CUFFT_INVALID_TYPE.";
+    case CUFFT_INVALID_VALUE: return "CUFFT_INVALID_VALUE.";
+    case CUFFT_INTERNAL_ERROR: return "CUFFT_INTERNAL_ERROR.";
+    case CUFFT_EXEC_FAILED: return "CUFFT_EXEC_FAILED.";
+    case CUFFT_SETUP_FAILED: return "CUFFT_SETUP_FAILED.";
+    case CUFFT_INVALID_SIZE: return "CUFFT_INVALID_SIZE.";
+    case CUFFT_UNALIGNED_DATA: return "CUFFT_UNALIGNED_DATA.";
+    default: return "CUFFT Unknown error code.";
+    }
+}
+
+void inline __cufftSafeCall(cufftResult err, const char * file, const int line)
+{
+    if (CUFFT_SUCCESS != err)
+    {
+        printf("CUFFT error %d: %s\n%s(%d)\n", (int)err, __cufftResultToString(err), file, line);
+    }
+}
+
+// vim: set ff=unix fenc=utf8 et sw=4 ts=4 sts=4:
diff --git a/cpp/modmesh/transform/CMakeLists.txt b/cpp/modmesh/transform/CMakeLists.txt
index 23249ad2..778e4685 100644
--- a/cpp/modmesh/transform/CMakeLists.txt
+++ b/cpp/modmesh/transform/CMakeLists.txt
@@ -5,6 +5,11 @@ set(MODMESH_TRANSFORM_HEADERS
     ${CMAKE_CURRENT_SOURCE_DIR}/fourier.hpp
     CACHE FILEPATH "" FORCE)
 
+if (BUILD_CUDA)
+    list(APPEND MODMESH_TRANSFORM_HEADERS
+        ${CMAKE_CURRENT_SOURCE_DIR}/fourier.cuh)
+endif()
+
 set(MODMESH_TRANSFORM_SOURCES
     ${CMAKE_CURRENT_SOURCE_DIR}/fourier.cpp
     CACHE FILEPATH "" FORCE)
diff --git a/cpp/modmesh/transform/fourier.cuh b/cpp/modmesh/transform/fourier.cuh
new file mode 100644
index 00000000..c4573af6
--- /dev/null
+++ b/cpp/modmesh/transform/fourier.cuh
@@ -0,0 +1,85 @@
+#pragma once
+
+/*
+ * Copyright (c) 2025, Alex Chiang <jyxemperor@gmail.com>
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions are met:
+ *
+ * - Redistributions of source code must retain the above copyright notice,
+ *   this list of conditions and the following disclaimer.
+ * - Redistributions in binary form must reproduce the above copyright notice,
+ *   this list of conditions and the following disclaimer in the documentation
+ *   and/or other materials provided with the distribution.
+ * - Neither the name of the copyright holder nor the names of its contributors
+ *   may be used to endorse or promote products derived from this software
+ *   without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+ * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+ * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
+ * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
+ * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
+ * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
+ * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
+ * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
+ * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
+ * POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include <modmesh/modmesh.hpp>
+#include <modmesh/buffer/buffer.hpp>
+#include <modmesh/device/cuda/cuda_error_handle.hpp>
+
+#define FFT_CUDA_IMPL(CUFFT_DATA_TYPE, CUFFT_EXEC_TYPE)                                                    \
+{                                                                                                          \
+    cufftHandle plan;                                                                                      \
+    CUFFT_DATA_TYPE * host_in = nullptr;                                                                   \
+    CUFFT_DATA_TYPE * host_out = nullptr;                                                                  \
+    CUFFT_DATA_TYPE * device_in = nullptr;                                                                 \
+    CUFFT_DATA_TYPE * device_out = nullptr;                                                                \
+    host_in = (CUFFT_DATA_TYPE*)malloc(sizeof(CUFFT_DATA_TYPE) * N);                                       \
+    host_out = (CUFFT_DATA_TYPE*)malloc(sizeof(CUFFT_DATA_TYPE) * N);                                      \
+    for (size_t i = 0; i < N; ++i)                                                                         \
+    {                                                                                                      \
+        host_in[i].x = in[i].real();                                                                       \
+        host_in[i].y = in[i].imag();                                                                       \
+    }                                                                                                      \
+    CUDA_SAFE_CALL(cudaMalloc((void**)&device_in, sizeof(CUFFT_DATA_TYPE) * N));                           \
+    CUDA_SAFE_CALL(cudaMalloc((void**)&device_out, sizeof(CUFFT_DATA_TYPE) * N));                          \
+    CUDA_SAFE_CALL(cudaMemcpy(device_in, host_in, sizeof(CUFFT_DATA_TYPE) * N, cudaMemcpyHostToDevice));   \
+    CUFFT_SAFE_CALL(cufftPlan1d(&plan, N, CUFFT_##CUFFT_EXEC_TYPE, 1));                                    \
+    CUFFT_SAFE_CALL(cufftExec##CUFFT_EXEC_TYPE(plan, device_in, device_out, CUFFT_FORWARD));               \
+    CUDA_SAFE_CALL(cudaMemcpy(host_out, device_out, sizeof(CUFFT_DATA_TYPE) * N, cudaMemcpyDeviceToHost)); \
+    for (size_t i = 0; i < N; ++i)                                                                         \
+    {                                                                                                      \
+        out[i] = T1<T2>{ host_out[i].x, host_out[i].y };                                                   \
+    }                                                                                                      \
+    CUFFT_SAFE_CALL(cufftDestroy(plan));                                                                   \
+    CUDA_SAFE_CALL(cudaFree(device_in));                                                                   \
+    CUDA_SAFE_CALL(cudaFree(device_out));                                                                  \
+    free(host_in);                                                                                         \
+    free(host_out);                                                                                        \
+}
+
+namespace modmesh
+{
+
+template <template <typename> class T1, typename T2>
+void fft_cuda(SimpleArray<T1<T2>> const & in, SimpleArray<T1<T2>> & out)
+{
+    size_t N = in.size();
+    if constexpr (std::is_same_v<T2, float>)
+    {
+        FFT_CUDA_IMPL(cufftComplex, C2C)
+    }
+    else if constexpr (std::is_same_v<T2, double>)
+    {
+        FFT_CUDA_IMPL(cufftDoubleComplex, Z2Z)
+    }
+}
+
+} /* namespace modmesh */
+
+// vim: set ff=unix fenc=utf8 et sw=4 ts=4 sts=4:
diff --git a/cpp/modmesh/transform/fourier.hpp b/cpp/modmesh/transform/fourier.hpp
index a63926cb..c9555dd6 100644
--- a/cpp/modmesh/transform/fourier.hpp
+++ b/cpp/modmesh/transform/fourier.hpp
@@ -3,6 +3,10 @@
 #include <modmesh/math/math.hpp>
 #include <modmesh/buffer/buffer.hpp>
 
+#if defined(BUILD_CUDA)
+#include <modmesh/transform/fourier.cuh>
+#endif
+
 namespace modmesh
 {
 
@@ -63,22 +67,37 @@ class FourierTransform
     FourierTransform & operator=(FourierTransform && other) = delete;
 
     template <template <typename> class T1, typename T2>
-    static void fft(SimpleArray<T1<T2>> const & in, SimpleArray<T1<T2>> & out)
+    static void fft(SimpleArray<T1<T2>> const & in, SimpleArray<T1<T2>> & out, std::string const && backend)
     {
         const size_t N = in.size();
 
-        if ((N & (N - 1)) == 0)
+        if (backend == "cpu")
+        {
+            if ((N & (N - 1)) == 0)
+            {
+                detail::fft_radix_2<T1, T2>(in, out);
+            }
+            else
+            {
+                detail::fft_bluestein<T1, T2>(in, out);
+            }
+        }
+        else if (backend == "cuda")
         {
-            detail::fft_radix_2<T1, T2>(in, out);
+#if defined(BUILD_CUDA)
+            modmesh::fft_cuda<T1, T2>(in, out);
+#else
+            throw std::runtime_error("CUDA is not available.");
+#endif
         }
         else
         {
-            detail::fft_bluestein<T1, T2>(in, out);
+            throw std::runtime_error("unsupported backend.");
         }
     }
 
     template <template <typename> class T1, typename T2>
-    static void ifft(SimpleArray<T1<T2>> const & in, SimpleArray<T1<T2>> & out)
+    static void ifft(SimpleArray<T1<T2>> const & in, SimpleArray<T1<T2>> & out, std::string const && backend)
     {
         size_t N = in.size();
         SimpleArray<T1<T2>> in_conj{modmesh::small_vector<size_t>{N}, T1<T2>{0.0, 0.0}};
@@ -88,7 +107,7 @@ class FourierTransform
             in_conj[i] = in[i].conj();
         }
 
-        fft<T1, T2>(in_conj, out);
+        fft<T1, T2>(in_conj, out, std::move(backend));
 
         for (size_t i = 0; i < N; ++i)
         {
@@ -152,7 +171,7 @@ void fft_bluestein(SimpleArray<T1<T2>> const & in, SimpleArray<T1<T2>> & out)
         A[i] *= B[i];
     }
 
-    FourierTransform::ifft<T1, T2>(A, a);
+    FourierTransform::ifft<T1, T2>(A, a, "cpu");
 
     for (size_t i = 0; i < N; ++i)
     {
diff --git a/cpp/modmesh/transform/pymod/wrap_fourier.cpp b/cpp/modmesh/transform/pymod/wrap_fourier.cpp
index 42879a29..6f4db409 100644
--- a/cpp/modmesh/transform/pymod/wrap_fourier.cpp
+++ b/cpp/modmesh/transform/pymod/wrap_fourier.cpp
@@ -53,10 +53,10 @@ class MODMESH_PYTHON_WRAPPER_VISIBILITY WrapFourierTransform
         namespace py = pybind11; // NOLINT(misc-unused-alias-decls)
 
         (*this)
-            .def_static("fft", &wrapped_type::fft<modmesh::Complex, double>, py::arg("input"), py::arg("output"))
-            .def_static("fft", &wrapped_type::fft<modmesh::Complex, float>, py::arg("input"), py::arg("output"))
-            .def_static("ifft", &wrapped_type::ifft<modmesh::Complex, double>, py::arg("input"), py::arg("output"))
-            .def_static("ifft", &wrapped_type::ifft<modmesh::Complex, float>, py::arg("input"), py::arg("output"))
+            .def_static("fft", &wrapped_type::fft<modmesh::Complex, double>, py::arg("input"), py::arg("output"), py::arg("backend"))
+            .def_static("fft", &wrapped_type::fft<modmesh::Complex, float>, py::arg("input"), py::arg("output"), py::arg("backend"))
+            .def_static("ifft", &wrapped_type::ifft<modmesh::Complex, double>, py::arg("input"), py::arg("output"), py::arg("backend"))
+            .def_static("ifft", &wrapped_type::ifft<modmesh::Complex, float>, py::arg("input"), py::arg("output"), py::arg("backend"))
             .def_static("dft", &wrapped_type::dft<modmesh::Complex, double>, py::arg("input"), py::arg("output"))
             .def_static("dft", &wrapped_type::dft<modmesh::Complex, float>, py::arg("input"), py::arg("output"));
     }
diff --git a/gtests/CMakeLists.txt b/gtests/CMakeLists.txt
index 48e0aaec..0ab83226 100644
--- a/gtests/CMakeLists.txt
+++ b/gtests/CMakeLists.txt
@@ -39,6 +39,18 @@ target_link_libraries(
     GTest::gmock_main
 )
 
+if (BUILD_CUDA)
+    find_package(CUDA REQUIRED)
+    find_package(CUDAToolkit REQUIRED)
+    enable_language(CUDA)
+    target_link_libraries(
+        test_nopython
+        CUDA::cudart
+        CUDA::cufft
+    )
+    target_compile_definitions(test_nopython PRIVATE BUILD_CUDA)
+endif()
+
 include(GoogleTest)
 gtest_discover_tests(test_nopython)
 
diff --git a/gtests/test_nopython_transform.cpp b/gtests/test_nopython_transform.cpp
index 55ecd55d..66351a1b 100644
--- a/gtests/test_nopython_transform.cpp
+++ b/gtests/test_nopython_transform.cpp
@@ -148,9 +148,12 @@ TYPED_TEST_SUITE(InverseTest, TestTypes);
 
 TYPED_TEST(ParsevalTest, fft)
 {
-    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->out);
-
+    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->out, "cpu");
+    this->verify_parseval();
+#if defined(BUILD_CUDA)
+    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->out, "cuda");
     this->verify_parseval();
+#endif
 }
 
 TYPED_TEST(ParsevalTest, dft)
@@ -162,9 +165,12 @@ TYPED_TEST(ParsevalTest, dft)
 
 TYPED_TEST(DeltaFunctionTest, fft)
 {
-    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->out);
-
+    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->out, "cpu");
     this->verify_delta_function();
+#if defined(BUILD_CUDA)
+    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->out, "cuda");
+    this->verify_delta_function();
+#endif
 }
 
 TYPED_TEST(DeltaFunctionTest, dft)
@@ -176,18 +182,29 @@ TYPED_TEST(DeltaFunctionTest, dft)
 
 TYPED_TEST(InverseTest, fft)
 {
-    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->freq_domain);
-    modmesh::FourierTransform::ifft<modmesh::Complex, typename TypeParam::Type>(this->freq_domain, this->time_domain);
-
+    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->freq_domain, "cpu");
+    modmesh::FourierTransform::ifft<modmesh::Complex, typename TypeParam::Type>(this->freq_domain, this->time_domain, "cpu");
     this->verify_inverse_fft_function();
+#if defined(BUILD_CUDA)
+    modmesh::FourierTransform::fft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->freq_domain, "cuda");
+    modmesh::FourierTransform::ifft<modmesh::Complex, typename TypeParam::Type>(this->freq_domain, this->time_domain, "cuda");
+    this->verify_inverse_fft_function();
+#endif
 }
 
 TYPED_TEST(InverseTest, dft)
 {
     modmesh::FourierTransform::dft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->freq_domain);
-    modmesh::FourierTransform::ifft<modmesh::Complex, typename TypeParam::Type>(this->freq_domain, this->time_domain);
-
+    modmesh::FourierTransform::ifft<modmesh::Complex, typename TypeParam::Type>(this->freq_domain, this->time_domain, "cpu");
     this->verify_inverse_fft_function();
+#if defined(BUILD_CUDA)
+    // output buffer must be zero-initialized before calling dft
+    for (size_t i = 0; i < this->freq_domain.size(); ++i)
+        this->freq_domain[i] = {0.0, 0.0};
+    modmesh::FourierTransform::dft<modmesh::Complex, typename TypeParam::Type>(this->signal, this->freq_domain);
+    modmesh::FourierTransform::ifft<modmesh::Complex, typename TypeParam::Type>(this->freq_domain, this->time_domain, "cuda");
+    this->verify_inverse_fft_function();
+#endif
 }
 
 // vim: set ff=unix fenc=utf8 et sw=4 ts=4 sts=4:
diff --git a/tests/test_transform.py b/tests/test_transform.py
index ca14e508..3a3c02f0 100644
--- a/tests/test_transform.py
+++ b/tests/test_transform.py
@@ -70,7 +70,7 @@ def test_numpy_fft_comparison(self):
         np_input = np.array(mm_input, copy=False)
 
         mm_output = self.SimpleArray(input_size, self.complex())
-        mm.FourierTransform.fft(mm_input, mm_output)
+        mm.FourierTransform.fft(mm_input, mm_output, "cpu")
 
         np_output = np.fft.fft(np_input)
 
@@ -88,7 +88,7 @@ def test_numpy_ifft_comparison(self):
         np_input = np.array(mm_input, copy=False)
 
         mm_output = self.SimpleArray(input_size, self.complex())
-        mm.FourierTransform.ifft(mm_input, mm_output)
+        mm.FourierTransform.ifft(mm_input, mm_output, "cpu")
 
         np_output = np.fft.ifft(np_input)