deepmodeling
diff --git a/‎source/module_base/fft/fft_term.cpp‎
Lines changed: 280 additions & 0 deletions b/‎source/module_base/fft/fft_term.cpp‎
Lines changed: 280 additions & 0 deletions
diff --git a/‎source/module_basis/module_pw/CMakeLists.txt‎
Lines changed: 2 additions & 0 deletions b/‎source/module_basis/module_pw/CMakeLists.txt‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎source/module_basis/module_pw/fft_base.cpp‎
Lines changed: 43 additions & 0 deletions b/‎source/module_basis/module_pw/fft_base.cpp‎
Lines changed: 43 additions & 0 deletions
@@ -0,0 +1,280 @@
+#include <cassert>
+#include "fft_temp.h"
+// #include "fft_cpu.h"
+#if defined(__CUDA)
+#include "fft_cuda.h"
+#endif
+#if defined(__ROCM)
+#include "fft_rcom.h"
+#endif
+#include "module_base/module_device/device.h"
+// #include "fft_gpu.h"
+// Default constructor: no backend is created; both backend pointers are null
+// until setfft() assigns them.
+FFT1::FFT1()
+{
+    fft_double = nullptr;
+    fft_float = nullptr;
+}
+// Construct the dispatcher and allocate one float and one double backend.
+//
+// device_in    : "cpu" or "gpu" (checked with assert).
+// precision_in : "single", "double" or "mixing" (checked with assert).
+//
+// Both backend pointers are set to nullptr before anything else so that the
+// destructor never deletes an indeterminate pointer. Without this, a "gpu"
+// request in a build where neither __ROCM nor __CUDA is defined (or an invalid
+// device string in a build where assert is compiled out) would leave them
+// unassigned by this constructor.
+FFT1::FFT1(std::string device_in,std::string precision_in)
+{
+    fft_float = nullptr;
+    fft_double = nullptr;
+    assert(device_in=="cpu" || device_in=="gpu");
+    assert(precision_in=="single" || precision_in=="double" || precision_in=="mixing");
+    this->device = device_in;
+    this->precision = precision_in;
+    if (device=="cpu")
+    {
+        fft_float = new FFT_CPU<float>();
+        fft_double = new FFT_CPU<double>();
+    }
+    else if (device=="gpu")
+    {        
+        // ROCm takes priority over CUDA when both macros are defined.
+        #if defined(__ROCM)
+            fft_float = new FFT_RCOM<float>();
+            fft_double = new FFT_RCOM<double>();
+        #elif defined(__CUDA)
+            fft_float = new FFT_CUDA<float>();
+            fft_double = new FFT_CUDA<double>();
+        #endif
+    }
+}
+
+// Destructor: releases both backends and resets the pointers.
+FFT1::~FFT1()
+{
+    // Deleting a null pointer is a no-op, so no explicit null checks are needed.
+    delete fft_float;
+    fft_float = nullptr;
+
+    delete fft_double;
+    fft_double = nullptr;
+}
+
+// Store the device name. Only the string is updated; the backend objects are
+// not recreated here (setfft() does that).
+void FFT1::set_device(std::string device_in)
+{
+    device = device_in;
+}
+
+// Store the precision name. The value is read by initfft() to decide which
+// backend(s) to initialise.
+void FFT1::set_precision(std::string precision_in)
+{
+    precision = precision_in;
+}
+// Select device and precision and (re)create the float and double backends.
+//
+// device_in    : "cpu" or "gpu" (checked with assert).
+// precision_in : "single", "double" or "mixing" (checked with assert).
+//
+// Any backends created by an earlier constructor or setfft() call are deleted
+// first; previously the pointers were simply overwritten, leaking the old
+// objects. The pointers are reset to nullptr so that a "gpu" request in a build
+// without __ROCM/__CUDA does not leave them dangling.
+// float_flag / double_flag are not modified here.
+void FFT1::setfft(std::string device_in,std::string precision_in)
+{
+    assert(device_in=="cpu" || device_in=="gpu");
+    assert(precision_in=="single" || precision_in=="double" || precision_in=="mixing");
+    this->device = device_in;
+    this->precision = precision_in;
+
+    // Release the previous backends (delete on nullptr is a no-op).
+    delete fft_float;
+    fft_float = nullptr;
+    delete fft_double;
+    fft_double = nullptr;
+
+    if (device=="cpu")
+    {
+        fft_float = new FFT_CPU<float>();
+        fft_double = new FFT_CPU<double>();
+    }
+    else if (device=="gpu")
+    {      
+        // ROCm takes priority over CUDA when both macros are defined.
+        #if defined(__ROCM)
+            fft_float = new FFT_RCOM<float>();
+            fft_double = new FFT_RCOM<double>();
+        #elif defined(__CUDA)
+            fft_float = new FFT_CUDA<float>();
+            fft_double = new FFT_CUDA<double>();
+        #endif
+    }
+}
+// Initialise the backend(s) selected by the current precision string.
+//
+// "single" enables the float backend, "double" the double backend and
+// "mixing" both. Every enabled backend first receives the stored fft_mode and
+// is then given all arguments unchanged through its own initfft().
+//
+// NOTE(review): the flags are only ever set here, never cleared, so a flag
+// raised by an earlier call stays raised if the precision is changed later.
+//
+// The backend pointers are null after default construction (and after a "gpu"
+// request without a compiled GPU backend), so they are asserted before use to
+// turn a null dereference into a diagnosable failure in debug builds.
+void FFT1::initfft(int nx_in, int ny_in, int nz_in, int lixy_in, int rixy_in, int ns_in, int nplane_in, 
+                     int nproc_in, bool gamma_only_in, bool xprime_in , bool mpifft_in)
+{
+    if (this->precision=="single")
+    {
+        float_flag = 1;
+    }
+    else if (this->precision=="double")
+    {
+        double_flag = 1;
+    }
+    else if (this->precision=="mixing")
+    {
+        float_flag = 1;
+        double_flag = 1;
+    }
+    if (float_flag)
+    {
+        assert(fft_float!=nullptr);
+        fft_float->initfftmode(this->fft_mode);
+        fft_float->initfft(nx_in,ny_in,nz_in,lixy_in,rixy_in,ns_in,nplane_in,nproc_in,gamma_only_in,xprime_in,mpifft_in);
+    }
+    if (double_flag)
+    {
+        assert(fft_double!=nullptr);
+        fft_double->initfftmode(this->fft_mode);
+        fft_double->initfft(nx_in,ny_in,nz_in,lixy_in,rixy_in,ns_in,nplane_in,nproc_in,gamma_only_in,xprime_in,mpifft_in);
+    }
+}
+// Store the FFT mode; initfft() hands this value to each enabled backend.
+void FFT1::initfftmode(int fft_mode_in)
+{
+    fft_mode = fft_mode_in;
+}
+
+// Call setupFFT() on every enabled backend, double precision first.
+void FFT1::setupFFT()
+{
+    if (double_flag) { fft_double->setupFFT(); }
+    if (float_flag)  { fft_float->setupFFT(); }
+}
+
+// Call cleanFFT() on every enabled backend, double precision first.
+void FFT1::clearFFT()
+{
+    if (double_flag) { fft_double->cleanFFT(); }
+    if (float_flag)  { fft_float->cleanFFT(); }
+}
+// Run clearFFT() and then call clear() on every enabled backend
+// (float first, then double). The backend objects themselves are kept.
+void FFT1::clear()
+{
+    clearFFT();
+    if (float_flag)  { fft_float->clear(); }
+    if (double_flag) { fft_double->clear(); }
+}
+// access the real space data
+// float specialization: returns whatever fft_float->get_rspace_data() returns.
+template <>
+float* FFT1::get_rspace_data() const
+{
+    float* const rspace = fft_float->get_rspace_data();
+    return rspace;
+}
+
+// double specialization: returns whatever fft_double->get_rspace_data() returns.
+template <>
+double* FFT1::get_rspace_data() const
+{
+    double* const rspace = fft_double->get_rspace_data();
+    return rspace;
+}
+// complex<float> specialization: forwards to fft_float->get_auxr_data().
+template <>
+std::complex<float>* FFT1::get_auxr_data() const
+{
+    std::complex<float>* const auxr = fft_float->get_auxr_data();
+    return auxr;
+}
+// complex<double> specialization: forwards to fft_double->get_auxr_data().
+template <>
+std::complex<double>* FFT1::get_auxr_data() const
+{
+    std::complex<double>* const auxr = fft_double->get_auxr_data();
+    return auxr;
+}
+// complex<float> specialization: forwards to fft_float->get_auxg_data().
+template <>
+std::complex<float>* FFT1::get_auxg_data() const
+{
+    std::complex<float>* const auxg = fft_float->get_auxg_data();
+    return auxg;
+}
+// complex<double> specialization: forwards to fft_double->get_auxg_data().
+template <>
+std::complex<double>* FFT1::get_auxg_data() const
+{
+    std::complex<double>* const auxg = fft_double->get_auxg_data();
+    return auxg;
+}
+// complex<float> specialization: forwards to fft_float->get_auxr_3d_data().
+template <>
+std::complex<float>* FFT1::get_auxr_3d_data() const
+{
+    std::complex<float>* const auxr_3d = fft_float->get_auxr_3d_data();
+    return auxr_3d;
+}
+// complex<double> specialization: forwards to fft_double->get_auxr_3d_data().
+template <>
+std::complex<double>* FFT1::get_auxr_3d_data() const
+{
+    std::complex<double>* const auxr_3d = fft_double->get_auxr_3d_data();
+    return auxr_3d;
+}
+// Single-precision fftxyfor: delegates to the float backend with the same buffers.
+template <>
+void FFT1::fftxyfor(std::complex<float>* in, std::complex<float>* out) const
+{
+    auto* const backend = fft_float;
+    backend->fftxyfor(in, out);
+}
+
+// Double-precision fftxyfor: delegates to the double backend with the same buffers.
+template <>
+void FFT1::fftxyfor(std::complex<double>* in, std::complex<double>* out) const
+{
+    auto* const backend = fft_double;
+    backend->fftxyfor(in, out);
+}
+
+// Single-precision fftzfor: delegates to the float backend with the same buffers.
+template <>
+void FFT1::fftzfor(std::complex<float>* in, std::complex<float>* out) const
+{
+    auto* const backend = fft_float;
+    backend->fftzfor(in, out);
+}
+// Double-precision fftzfor: delegates to the double backend with the same buffers.
+template <>
+void FFT1::fftzfor(std::complex<double>* in, std::complex<double>* out) const
+{
+    auto* const backend = fft_double;
+    backend->fftzfor(in, out);
+}
+
+// Single-precision fftxybac: delegates to the float backend with the same buffers.
+template <>
+void FFT1::fftxybac(std::complex<float>* in, std::complex<float>* out) const
+{
+    auto* const backend = fft_float;
+    backend->fftxybac(in, out);
+}
+// Double-precision fftxybac: delegates to the double backend with the same buffers.
+template <>
+void FFT1::fftxybac(std::complex<double>* in, std::complex<double>* out) const
+{
+    auto* const backend = fft_double;
+    backend->fftxybac(in, out);
+}
+
+// Single-precision fftzbac: delegates to the float backend with the same buffers.
+template <>
+void FFT1::fftzbac(std::complex<float>* in, std::complex<float>* out) const
+{
+    auto* const backend = fft_float;
+    backend->fftzbac(in, out);
+}
+// Double-precision fftzbac: delegates to the double backend with the same buffers.
+template <>
+void FFT1::fftzbac(std::complex<double>* in, std::complex<double>* out) const
+{
+    auto* const backend = fft_double;
+    backend->fftzbac(in, out);
+}
+// Single-precision fftxyr2c (real input, complex output): delegates to the
+// float backend with the same buffers.
+template <>
+void FFT1::fftxyr2c(float* in, std::complex<float>* out) const
+{
+    auto* const backend = fft_float;
+    backend->fftxyr2c(in, out);
+}
+// Double-precision fftxyr2c (real input, complex output): delegates to the
+// double backend with the same buffers.
+template <>
+void FFT1::fftxyr2c(double* in, std::complex<double>* out) const
+{
+    auto* const backend = fft_double;
+    backend->fftxyr2c(in, out);
+}
+
+// Single-precision fftxyc2r (complex input, real output): delegates to the
+// float backend with the same buffers.
+template <>
+void FFT1::fftxyc2r(std::complex<float>* in, float* out) const
+{
+    auto* const backend = fft_float;
+    backend->fftxyc2r(in, out);
+}
+// Double-precision fftxyc2r (complex input, real output): delegates to the
+// double backend with the same buffers.
+template <>
+void FFT1::fftxyc2r(std::complex<double>* in, double* out) const
+{
+    auto* const backend = fft_double;
+    backend->fftxyc2r(in, out);
+}
+
+// Single-precision fft3D_forward for the DEVICE_GPU tag: delegates to the
+// float backend. The ctx argument is not used in the body.
+template <>
+void  FFT1::fft3D_forward(const base_device::DEVICE_GPU* ctx, std::complex<float>* in, std::complex<float>* out) const
+{
+    auto* const backend = fft_float;
+    backend->fft3D_forward(in, out);
+}
+
+// Double-precision fft3D_forward for the DEVICE_GPU tag: delegates to the
+// double backend. The ctx argument is not used in the body.
+template <>
+void  FFT1::fft3D_forward(const base_device::DEVICE_GPU* ctx, std::complex<double>* in, std::complex<double>* out) const
+{
+    auto* const backend = fft_double;
+    backend->fft3D_forward(in, out);
+}
+// Single-precision fft3D_backward for the DEVICE_GPU tag: delegates to the
+// float backend. The ctx argument is not used in the body.
+template <>
+void  FFT1::fft3D_backward(const base_device::DEVICE_GPU* ctx, std::complex<float>* in, std::complex<float>* out) const
+{
+    auto* const backend = fft_float;
+    backend->fft3D_backward(in, out);
+}
+// Double-precision fft3D_backward for the DEVICE_GPU tag: delegates to the
+// double backend. The ctx argument is not used in the body.
+template <>
+void  FFT1::fft3D_backward(const base_device::DEVICE_GPU* ctx, std::complex<double>* in, std::complex<double>* out) const
+{
+    auto* const backend = fft_double;
+    backend->fft3D_backward(in, out);
+}
@@ -1,5 +1,7 @@
 list(APPEND objects
     fft.cpp
+    fft_base.cpp
+    fft_temp.cpp
     pw_basis.cpp
     pw_basis_k.cpp
     pw_basis_sup.cpp
 
@@ -0,0 +1,43 @@
+#include "fft_base.h"
+// Constructor: intentionally empty; nothing is initialised here.
+template <typename FPTYPE>
+FFT_BASE<FPTYPE>::FFT_BASE() {}
+// Destructor: intentionally empty; nothing is released here.
+template <typename FPTYPE>
+FFT_BASE<FPTYPE>::~FFT_BASE() {}
+// Store the grid sizes and layout settings and derive the dependent sizes.
+//
+// Each *_in argument is copied to the member of the same name without the
+// suffix. Derived members:
+//   fftnx, fftny : equal to nx, ny, except that when gamma_only is set one of
+//                  them becomes n/2 + 1 (fftnx if xprime, otherwise fftny).
+//   nxy          : nx * ny
+//   fftnxy       : fftnx * fftny
+//   maxgrids     : the larger of nz * ns and nxy * nplane
+template <typename FPTYPE>
+void FFT_BASE<FPTYPE>::initfft(int nx_in, int ny_in, int nz_in, int lixy_in, int rixy_in, int ns_in, int nplane_in,
+                               int nproc_in, bool gamma_only_in, bool xprime_in, bool mpifft_in)
+{
+    // Plain copies of the caller-supplied settings.
+    this->gamma_only = gamma_only_in;
+    this->xprime = xprime_in;
+    this->mpifft = mpifft_in;
+    this->nproc = nproc_in;
+    this->nplane = nplane_in;
+    this->lixy = lixy_in;
+    this->rixy = rixy_in;
+    this->ns = ns_in;
+    this->nx = nx_in;
+    this->ny = ny_in;
+    this->nz = nz_in;
+
+    // Start from the full sizes, then shrink exactly one axis for gamma_only.
+    this->fftnx = this->nx;
+    this->fftny = this->ny;
+    if (this->gamma_only && this->xprime)
+    {
+        this->fftnx = int(this->nx / 2) + 1;
+    }
+    else if (this->gamma_only)
+    {
+        this->fftny = int(this->ny / 2) + 1;
+    }
+
+    this->nxy = this->nx * this->ny;
+    this->fftnxy = this->fftnx * this->fftny;
+
+    // maxgrids is the larger of the two products.
+    const int nxy_times_nplane = this->nxy * this->nplane;
+    const int nz_times_ns = this->nz * this->ns;
+    if (nz_times_ns > nxy_times_nplane)
+    {
+        this->maxgrids = nz_times_ns;
+    }
+    else
+    {
+        this->maxgrids = nxy_times_nplane;
+    }
+}
+
+// Explicit instantiations for the two supported precisions.
+// The member templates above are defined in this .cpp file, so every member
+// that other translation units may call has to be instantiated here. initfft
+// is listed explicitly so that its emission does not depend on it being
+// instantiated implicitly through some other path.
+template FFT_BASE<float>::FFT_BASE();
+template FFT_BASE<double>::FFT_BASE();
+template FFT_BASE<float>::~FFT_BASE();
+template FFT_BASE<double>::~FFT_BASE();
+template void FFT_BASE<float>::initfft(int, int, int, int, int, int, int, int, bool, bool, bool);
+template void FFT_BASE<double>::initfft(int, int, int, int, int, int, int, int, bool, bool, bool);