feat: Implement NTT and convolution functions for polynomial multiplication

weilycoder · weilycoder · commit ac1a6e030bca · 2025-11-07T09:14:15.000+08:00
diff --git a/test/convolution_mod.test.cpp b/test/convolution_mod.test.cpp
@@ -0,0 +1,23 @@
+#define PROBLEM "https://judge.yosupo.jp/problem/convolution_mod"
+
+#include "../weilycoder/poly/ntt_convolve.hpp"
+#include <iostream>
+#include <vector>
+using namespace std;
+using namespace weilycoder;
+
+// Reads two coefficient sequences from stdin, multiplies them modulo 998244353
+// with ntt_convolve_32, and prints the first n + m - 1 product coefficients on
+// one space-separated line.
+int main() {
+  cin.tie(nullptr)->sync_with_stdio(false);
+  // Turn malformed or truncated input into an exception instead of silent zeros.
+  cin.exceptions(cin.failbit | cin.badbit);
+  size_t n, m;
+  cin >> n >> m;
+  vector<uint64_t> a(n), b(m);
+  for (auto &coef : a)
+    cin >> coef;
+  for (auto &coef : b)
+    cin >> coef;
+  const auto c = ntt_convolve_32<998244353>(a, b);
+  const size_t out_len = n + m - 1;
+  for (size_t i = 0; i < out_len; ++i) {
+    // A space follows every coefficient except the last, which ends the line.
+    const char sep = (i + 1 == out_len) ? '\n' : ' ';
+    cout << c[i] << sep;
+  }
+  return 0;
+}
diff --git a/weilycoder/poly/ntt.hpp b/weilycoder/poly/ntt.hpp
@@ -0,0 +1,64 @@
+#ifndef WEILYCODER_POLY_NTT_HPP
+#define WEILYCODER_POLY_NTT_HPP
+
+#include "../number-theory/mod_utility.hpp"
+#include "../number-theory/primitive_root.hpp"
+#include "fft_utility.hpp"
+#include <cstdint>
+#include <vector>
+
+namespace weilycoder {
+/**
+ * @brief In-place Number Theoretic Transform (NTT) modulo a prime
+ *
+ * The length of y is validated first, so a rejected input is left unmodified.
+ * y is then reordered with fft_change() and processed by butterfly passes over
+ * blocks of size 2, 4, ..., y.size(). For the inverse transform the passes use
+ * mod_pow(root, mod - 2, mod) in place of root, and every element is finally
+ * multiplied by mod_pow(len, mod - 2, mod).
+ *
+ * NOTE(review): std::invalid_argument is declared in <stdexcept>, which this
+ * header does not include directly.
+ *
+ * @tparam mod The prime modulus
+ * @tparam inverse Whether to perform the inverse NTT
+ * @tparam bit32 Whether to use 32-bit modular multiplication
+ * @tparam root A primitive root modulo mod
+ * @param y The input/output vector to be transformed
+ * @throws std::invalid_argument if y.size() is zero or not a power of two, or
+ *         if mod - 1 is not divisible by y.size()
+ */
+template <uint64_t mod, bool inverse = false, bool bit32 = false,
+          uint64_t root = prime_primitive_root<mod>()>
+void ntt(std::vector<uint64_t> &y) {
+  static_assert(is_prime(mod), "mod must be a prime");
+  const size_t len = y.size();
+  // Validate before permuting: the caller's data must stay intact on failure.
+  if (len == 0 || (len & (len - 1)) != 0)
+    throw std::invalid_argument("Length of input vector must be a power of two");
+  if ((mod - 1) % len != 0)
+    throw std::invalid_argument(
+        "mod - 1 must be divisible by the length of input vector");
+  // Assumes fft_change() only reorders y and never resizes it -- TODO confirm.
+  fft_change(y);
+  constexpr uint64_t g = inverse ? mod_pow<bit32>(root, mod - 2, mod) : root;
+  for (size_t h = 2; h <= len; h <<= 1) {
+    const size_t half = h >> 1;
+    // Per-step twiddle multiplier for blocks of size h.
+    const uint64_t wn = mod_pow<bit32>(g, (mod - 1) / h, mod);
+    for (size_t j = 0; j < len; j += h) {
+      uint64_t w = 1;
+      for (size_t k = j; k < j + half; ++k) {
+        const uint64_t u = y[k];
+        const uint64_t t = mod_mul<bit32>(w, y[k + half], mod);
+        y[k] = mod_add<bit32>(u, t, mod);
+        y[k + half] = mod_sub<bit32>(u, t, mod);
+        w = mod_mul<bit32>(w, wn, mod);
+      }
+    }
+  }
+  if constexpr (inverse) {
+    // Scale every element by len^(mod - 2) to finish the inverse transform.
+    const uint64_t inv_len = mod_pow<bit32>(len, mod - 2, mod);
+    for (size_t i = 0; i < len; ++i)
+      y[i] = mod_mul<bit32>(y[i], inv_len, mod);
+  }
+}
+
+/**
+ * @brief Number Theoretic Transform (NTT) using 32-bit modular multiplication
+ *
+ * Thin wrapper that forwards to ntt with bit32 fixed to true. The default for
+ * root is spelled prime_primitive_root<mod>(), the same form ntt itself uses,
+ * so both entry points resolve the same default.
+ *
+ * @tparam mod The prime modulus
+ * @tparam inverse Whether to perform the inverse NTT
+ * @tparam root A primitive root modulo mod
+ * @param y The input/output vector to be transformed
+ * @throws std::invalid_argument under the same conditions as ntt
+ */
+template <uint64_t mod, bool inverse = false,
+          uint64_t root = prime_primitive_root<mod>()>
+void ntt_32(std::vector<uint64_t> &y) {
+  ntt<mod, inverse, true, root>(y);
+}
+} // namespace weilycoder
+
+#endif
diff --git a/weilycoder/poly/ntt_convolve.hpp b/weilycoder/poly/ntt_convolve.hpp
@@ -0,0 +1,31 @@
+#ifndef WEILYCODER_POLY_NTT_CONVOLVE_HPP
+#define WEILYCODER_POLY_NTT_CONVOLVE_HPP
+
+#include "ntt.hpp"
+#include <cstdint>
+#include <utility>
+#include <vector>
+
+namespace weilycoder {
+/**
+ * @brief Multiply two polynomials modulo mod using the NTT
+ *
+ * Both inputs are zero-padded to the smallest power of two that is at least
+ * a.size() + b.size() - 1, transformed with ntt, multiplied pointwise with
+ * mod_mul, and transformed back with the inverse ntt.
+ *
+ * @tparam mod The prime modulus
+ * @tparam bit32 Whether to use 32-bit modular multiplication
+ * @tparam root A primitive root modulo mod
+ * @param a Coefficients of the first polynomial
+ * @param b Coefficients of the second polynomial
+ * @return The product coefficients, of length a.size() + b.size() - 1, or an
+ *         empty vector if either input is empty
+ * @throws std::invalid_argument (from ntt) if mod - 1 is not divisible by the
+ *         padded transform length
+ */
+template <uint64_t mod, bool bit32 = false, uint64_t root = prime_primitive_root<mod>()>
+std::vector<uint64_t> ntt_convolve(std::vector<uint64_t> a, std::vector<uint64_t> b) {
+  // An empty operand gives an empty product; without this guard the length
+  // computation below would wrap around for two empty inputs.
+  if (a.empty() || b.empty())
+    return {};
+  // Capture the true result length before padding changes a.size()/b.size().
+  const size_t result_len = a.size() + b.size() - 1;
+  size_t n = 1;
+  while (n < result_len)
+    n <<= 1;
+  a.resize(n, 0);
+  b.resize(n, 0);
+  ntt<mod, false, bit32, root>(a);
+  ntt<mod, false, bit32, root>(b);
+  for (size_t i = 0; i < n; ++i)
+    a[i] = mod_mul<bit32>(a[i], b[i], mod);
+  ntt<mod, true, bit32, root>(a);
+  // Drop the padding so callers get exactly the product's coefficients.
+  a.resize(result_len);
+  return a;
+}
+
+/**
+ * @brief Multiply two polynomials modulo mod using 32-bit modular multiplication
+ *
+ * Thin wrapper that forwards to ntt_convolve with bit32 fixed to true. The
+ * by-value parameters are moved into the callee so the coefficient vectors
+ * are not copied a second time.
+ *
+ * @tparam mod The prime modulus
+ * @tparam root A primitive root modulo mod
+ * @param a Coefficients of the first polynomial
+ * @param b Coefficients of the second polynomial
+ * @return Whatever ntt_convolve<mod, true, root> returns for a and b
+ */
+template <uint64_t mod, uint64_t root = prime_primitive_root<mod>()>
+std::vector<uint64_t> ntt_convolve_32(std::vector<uint64_t> a,
+                                      std::vector<uint64_t> b) {
+  return ntt_convolve<mod, true, root>(std::move(a), std::move(b));
+}
+} // namespace weilycoder
+
+#endif