#pragma once
#include "../../../fps/bostan_mori/lib.hpp"
#include "../berlekamp_massey/lib.hpp"
namespace tifa_libs {
template <class poly, std::same_as<TPN poly::val_t> mint>
CEXP mint nth_term_lrec(u64 n, vec<mint> CR a, vec<mint> CR bm) NE {
if (n < a.size()) return a[n];
assert(!bm.empty() && bm[0] == 1);
poly q(bm);
q.strip();
return bostan_mori(n, (poly(a) * q).pre((u32)q.size() - 1), q);
}
template <class poly, std::same_as<TPN poly::val_t> mint>
CEXP mint nth_term_lrec(u64 n, vec<mint> CR a) NE {
if (n < a.size()) return a[n];
auto bm = berlekamp_massey(a);
return nth_term_lrec<poly, mint>(n, a, bm);
}
} // namespace tifa_libs
#line 2 "src/math/lrec/nth_term/lib.hpp"
#line 2 "src/fps/bostan_mori/lib.hpp"
#line 2 "src/conv/trans/ntt_doubling/lib.hpp"
#line 2 "src/math/qpow/basic/lib.hpp"
#line 2 "src/util/alias/num/lib.hpp"
#line 2 "src/util/util/lib.hpp"
// https://github.com/Tiphereth-A/CP-lib
#include <bits/extc++.h>
// clang-format off
namespace tifa_libs {
#define CEXP constexpr
#define CEXPE constexpr explicit
#define CR const&
#define CP const*
#define PC *const
#define CPC const*const
#define TPN typename
#define NE noexcept
#define CNE const noexcept
#define ND [[nodiscard]]
#define cT_(...) std::conditional_t<sizeof(__VA_ARGS__) <= sizeof(size_t) * 2, __VA_ARGS__, __VA_ARGS__ CR>
// NOLINTNEXTLINE(misc-const-correctness)
#define flt_(T, i, l, r, ...) for (T i = (l), i##e = (r)__VA_OPT__(, ) __VA_ARGS__; i < i##e; ++i)
#define retif_(cond, if_true, ...) if cond return if_true __VA_OPT__(; else return __VA_ARGS__)
#ifdef ONLINE_JUDGE
#undef assert
#define assert(x) 42
#endif
using namespace std::ranges;
using namespace std::literals;
template <class T>
CEXP T abs(T x) NE { retif_((x < 0), -x, x); }
} // namespace tifa_libs
// clang-format on
#line 4 "src/util/alias/num/lib.hpp"
// clang-format off
namespace tifa_libs {
#define mk0_(w, t) using w = t; using c##w = const t
#define mk_(w, t) mk0_(w, t); CEXP w operator""_##w(unsigned long long x) NE { return (w)x; }
mk_(i8, int8_t) mk_(u8, uint8_t) mk_(i16, int16_t) mk_(u16, uint16_t) mk_(i32, int32_t) mk_(u32, uint32_t) mk_(i64, int64_t) mk_(u64, uint64_t) mk_(isz, ssize_t) mk_(usz, size_t) mk_(chr, char) mk_(schr, signed char) mk_(uchr, unsigned char) mk_(sint, signed) mk_(uint, unsigned);
mk0_(i128, __int128_t); mk0_(u128, __uint128_t); mk0_(f32, float); mk0_(f64, double); mk0_(f128, long double);
#undef mk0_
#undef mk_
} // namespace tifa_libs
// clang-format on
#line 4 "src/math/qpow/basic/lib.hpp"
namespace tifa_libs {
template <class T>
CEXP T qpow(T a, u64 b, cT_(T) init_v = T{1}) NE {
T res = init_v;
for (; b; b >>= 1, a = a * a) {
while (!(b & 1)) b >>= 1, a = a * a;
res = res * a;
}
return res;
}
} // namespace tifa_libs
#line 2 "src/util/alias/others/lib.hpp"
#line 2 "src/util/consts/lib.hpp"
#line 4 "src/util/consts/lib.hpp"
// clang-format off
namespace tifa_libs {
using std::numbers::pi_v;
template <std::floating_point FP>
inline FP eps_v = std::sqrt(std::numeric_limits<FP>::epsilon());
template <std::floating_point FP>
CEXP void set_eps(FP v) NE { eps_v<FP> = v; }
CEXP u32 TIME = ((__TIME__[0] & 15) << 20) | ((__TIME__[1] & 15) << 16) | ((__TIME__[3] & 15) << 12) | ((__TIME__[4] & 15) << 8) | ((__TIME__[6] & 15) << 4) | (__TIME__[7] & 15);
CEXP auto STR2U16 = [] { std::array<u32, 65536> table{}; table.fill(-1_u32); flt_ (u32, i, 48, 58) flt_ (u32, j, 48, 58) table[i << 8 | j] = (j & 15) * 10 + (i & 15); return table; }();
inline const auto fn_0 = [](auto&&...) NE {};
inline const auto fn_is0 = [](auto x) NE { return x == 0; };
} // namespace tifa_libs
// clang-format on
#line 4 "src/util/alias/others/lib.hpp"
namespace tifa_libs {
template <class T>
struct chash {
CEXP static u64 C = u64(pi_v<f128> * 2e18) | 71;
CEXP u64 operator()(T x) CNE { return __builtin_bswap64(((u64)x ^ TIME) * C); }
};
// clang-format off
#define mk_(w, t) using w = t; using c##w = const t;
mk_(strn, std::string) mk_(strnv, std::string_view)
#undef mk_
template <class T> struct edge_t { T w; u32 u, v; CEXP auto operator<=>(edge_t CR) const = default; }; template <class T> using cedge_t = const edge_t<T>;
template <class T> struct pt3 { T _0, _1, _2; CEXP auto operator<=>(pt3 CR) const = default; }; template <class T> using cpt3 = const pt3<T>;
template <class T> struct pt4 { T _0, _1, _2, _3; CEXP auto operator<=>(pt4 CR) const = default; }; template <class T> using cpt4 = const pt4<T>;
#define mkT_(w, t, ...) template <class T> using w = t __VA_OPT__(, ) __VA_ARGS__; template <class T> using c##w = const t __VA_OPT__(, ) __VA_ARGS__;
mkT_(ptt, std::pair<T, T>) mkT_(alc, std::pmr::polymorphic_allocator<T>) mkT_(vec, std::vector<T>) mkT_(vvec, vec<vec<T>>) mkT_(v3ec, vvec<vec<T>>) mkT_(vecpt, vec<ptt<T>>) mkT_(vvecpt, vvec<ptt<T>>) mkT_(ptvec, ptt<vec<T>>) mkT_(ptvvec, ptt<vvec<T>>)
#undef mkT_
template <class T> using itl = std ::initializer_list<T>;
template <class T, usz ext = std::dynamic_extent> using spn = std::span<T const, ext>;
template <class T, usz N> using arr = std::array<T, N>; template <class T, usz N> using carr = std::array<const T, N>;
template <class U, class T> using vecp = vec<std::pair<U, T>>; template <class U, class T> using vvecp = vvec<std::pair<U, T>>;
template <class U, class T> using vvecp = vvec<std::pair<U, T>>; template <class U, class T> using vvvecp = vvec<vvec<std::pair<U, T>>>;
#ifdef PB_DS_ASSOC_CNTNR_HPP
template <class T, class C = std::less<T>> using set = __gnu_pbds::tree<T, __gnu_pbds::null_type, C>;
template <class K, class V, class C = std::less<K>> using map = __gnu_pbds::tree<K, V, C>;
// hset<u64> s({}, {}, {}, {}, {1<<16});
template <class T, class HF = chash<T>> using hset = __gnu_pbds::gp_hash_table<T, __gnu_pbds::null_type, HF>;
// hmap<u64, int> s({}, {}, {}, {}, {1<<16});
template <class K, class V, class HF = chash<K>> using hmap = __gnu_pbds::gp_hash_table<K, V, HF>;
#else
using std::set, std::map;
template <class T, class HF = chash<T>> using hset = std::unordered_set<T, HF>;
template <class K, class V, class HF = chash<K>> using hmap = std::unordered_map<K, V, HF>;
#endif
#ifdef PB_DS_PRIORITY_QUEUE_HPP
template <class T, class C = std::less<T>> using pq = __gnu_pbds::priority_queue<T, C>;
#else
template <class T, class C = std::less<T>> using pq = std::priority_queue<T, vec<T>, C>;
#endif
template <class T> using pqg = pq<T, std::greater<T>>;
// clang-format on
#define mk1_(V, A, T) using V##A = V<T>;
#define mk_(V, A, T) mk1_(V, A, T) mk1_(c##V, A, T)
#define mk(A, T) mk_(edge_t, A, T) mk_(ptt, A, T) mk_(pt3, A, T) mk_(pt4, A, T) mk_(vec, A, T) mk_(vvec, A, T) mk_(v3ec, A, T) mk_(vecpt, A, T) mk_(vvecpt, A, T) mk_(ptvec, A, T) mk_(ptvvec, A, T) mk1_(spn, A, T) mk1_(itl, A, T)
mk(b, bool) mk(c, chr) mk(i, i32) mk(u, u32) mk(ii, i64) mk(uu, u64) mk(t, isz) mk(z, usz) mk(f, f32) mk(d, f64) mk(s, strn);
#undef mk
#undef mk_
#undef mk1_
} // namespace tifa_libs
#line 2 "src/util/traits/math/lib.hpp"
// clang-format off
#line 4 "src/util/traits/math/lib.hpp"
namespace tifa_libs {
template <class T> concept char_c = std::same_as<T, char> || std::same_as<T, signed char> || std::same_as<T, unsigned char>;
#pragma GCC diagnostic ignored "-Wpedantic"
template <class T> concept s128_c = std::same_as<T, __int128_t> || std::same_as<T, __int128>;
template <class T> concept u128_c = std::same_as<T, __uint128_t> || std::same_as<T, unsigned __int128>;
template <class T> concept i128_c = s128_c<T> || u128_c<T>;
#pragma GCC diagnostic warning "-Wpedantic"
template <class T> concept imost64_c = std::integral<T> && sizeof(T) * __CHAR_BIT__ <= 64;
template <class T> concept smost64_c = imost64_c<T> && std::signed_integral<T>;
template <class T> concept umost64_c = imost64_c<T> && std::unsigned_integral<T>;
template <class T> concept int_c = i128_c<T> || imost64_c<T>;
template <class T> concept sint_c = s128_c<T> || smost64_c<T>;
template <class T> concept uint_c = u128_c<T> || umost64_c<T>;
template <class T> concept arithm_c = std::is_arithmetic_v<T> || int_c<T>;
template <class T> concept mint_c = requires(T x) { {x.mod()} -> uint_c; {x.val()} -> uint_c; };
template <class T> concept dft_c = requires(T x, std::vector<TPN T::data_t> v, u32 n) { {x.size()} -> std::same_as<u32>; x.bzr(n); x.dif(v, n); x.dit(v, n); };
template <class T> concept ntt_c = dft_c<T> && requires(T x) { T::max_size; T::G; };
template <class T> struct to_sint : std::make_signed<T> {};
template <> struct to_sint<u128> { using type = i128; };
template <> struct to_sint<i128> { using type = i128; };
template <class T> using to_sint_t = TPN to_sint<T>::type;
template <class T> struct to_uint : std::make_unsigned<T> {};
template <> struct to_uint<u128> { using type = u128; };
template <> struct to_uint<i128> { using type = u128; };
template <class T> using to_uint_t = TPN to_uint<T>::type;
template <arithm_c T> struct to_bigger : std::make_unsigned<T> {};
#define _(w,ww) template <> struct to_bigger<w> { using type = ww; }
#define _2(w,ww) _(i##w,i##ww); _(u##w,u##ww);
_2(8, 16); _2(16, 32); _2(32, 64); _2(64, 128); _(f32, f64); _(f64, f128);
#undef _2
#undef _
template <class T> using to_bigger_t = TPN to_bigger<T>::type;
template <arithm_c T> CEXP T inf_v = [] {
if CEXP(sint_c<T>) return T(to_uint_t<T>(-1) / 4 - 1);
else if CEXP(uint_c<T>) return T(-1) / 2 - 1;
else return std::numeric_limits<T>::max() / 2 - 1;
}();
} // namespace tifa_libs
// clang-format on
#line 6 "src/conv/trans/ntt_doubling/lib.hpp"
namespace tifa_libs {
template <ntt_c NTT_t, std::same_as<TPN NTT_t::data_t> mint>
CEXP void ntt_doubling(NTT_t CR ntt, vec<mint>& f, u32 n = 0) NE {
if (!n) n = (u32)f.size() / 2;
assert(std::has_single_bit(n) && f.size() >= n * 2);
vec<mint> g(begin(f), begin(f) + n);
ntt.dit(g);
mint r = 1;
const mint zeta = qpow(ntt.G, (mint::mod() - 1) / (n * 2));
flt_ (u32, i, 0, n) g[i] *= r, r *= zeta;
ntt.dif(g), copy(g, begin(f) + n);
}
} // namespace tifa_libs
#line 2 "src/fps/ds/poly_c/lib.hpp"
#line 2 "src/util/strip/lib.hpp"
#line 4 "src/util/strip/lib.hpp"
namespace tifa_libs {
// pred(x) == true ==> drop
template <common_range R, class F>
CEXP auto lstrip_view(R CR range, F&& pred) NE {
auto v = range | views::drop_while(std::forward<F>(pred));
return subrange{begin(v), end(v)};
}
// pred(x) == true ==> drop
template <common_range R, class F>
CEXP auto rstrip_view(R CR range, F&& pred) NE {
auto v = range | views::reverse | views::drop_while(std::forward<F>(pred));
return subrange{end(v).base(), begin(v).base()};
}
// pred(x) == true ==> drop
template <common_range R, class F>
CEXP auto strip_view(R CR range, F&& pred) NE {
auto v = range | views::drop_while(std::forward<F>(pred)) | views::reverse | views::drop_while(std::forward<F>(pred));
return subrange{end(v).base(), begin(v).base()};
}
} // namespace tifa_libs
#line 2 "src/util/traits/others/lib.hpp"
// clang-format off
#line 4 "src/util/traits/others/lib.hpp"
namespace tifa_libs {
//! only for template without non-type argument
template <class, template <class...> class> CEXP bool specialized_from_v = false;
template <template <class...> class T, class... Args> CEXP bool specialized_from_v<T<Args...>, T> = true;
static_assert(specialized_from_v<vecu, std::vector>);
template <class T> concept container_c = common_range<T> && !std::is_array_v<std::remove_cvref_t<T>> && !std::same_as<std::remove_cvref_t<T>, strn> && !std::same_as<std::remove_cvref_t<T>, strnv>;
template <class T> concept istream_c = std::derived_from<T, std::istream> || std::derived_from<T, std::wistream> || requires(T is) { is.peek(); };
template <class T> concept ostream_c = std::derived_from<T, std::ostream> || std::derived_from<T, std::wostream> || requires(T os) { os.flush(); };
} // namespace tifa_libs
// clang-format on
#line 5 "src/fps/ds/poly_c/lib.hpp"
namespace tifa_libs {
// clang-format off
enum class CCORE : u8 { FFT_R2, NTT3, NTT };
// clang-format on
namespace poly_impl_ {
template <class ccore>
requires requires(ccore cc, vec<TPN ccore::val_t> l, vec<TPN ccore::val_t> r, u32 sz) {
{ ccore::ct_cat } -> std::same_as<CCORE CR>;
cc.conv(l, r), cc.conv(l, r, sz);
}
struct poly : vec<TPN ccore::val_t> {
using ccore_t = ccore;
using val_t = ccore_t::val_t;
using data_t = vec<val_t>;
static inline ccore_t conv_core;
CEXPE poly(u32 sz = 1, cT_(val_t) val = val_t{}) NE : data_t(sz, val) {}
CEXP poly(TPN data_t::const_iterator begin, TPN data_t::const_iterator end) NE : data_t(begin, end) {}
CEXP poly(data_t CR v) NE : data_t(v) {}
CEXP poly(data_t&& v) NE : data_t(std::move(v)) {}
CEXP poly(itl<val_t> v) NE : data_t(v) {}
CEXP poly(common_range auto CR v) NE : data_t(begin(v), end(v)) {}
friend CEXP auto& operator>>(istream_c auto& is, poly& poly) NE {
for (auto& val : poly) is >> val;
return is;
}
friend CEXP auto& operator<<(ostream_c auto& os, poly CR poly) NE {
retif_((!poly.size()) [[unlikely]], os);
flt_ (u32, i, 1, (u32)poly.size()) os << poly[i - 1] << ' ';
return os << poly.back();
}
ND CEXP bool is_zero() CNE {
for (auto&& i : *this)
if (i != 0) return false;
return true;
}
CEXP val_t operator()(val_t x) CNE {
val_t ans = 0;
for (u32 i = data_t::size() - 1; ~i; --i) ans = ans * x + data_t::data()[i];
return ans;
}
template <class F>
requires requires(F f, u32 idx, val_t& val) { f(idx, val); }
CEXP void apply_range(u32 l, u32 r, F&& f) NE {
assert(l < r && r <= data_t::size());
flt_ (u32, i, l, r) f(i, data_t::data()[i]);
}
template <class F>
CEXP void apply(F&& f) NE { apply_range(0, (u32)data_t::size(), std::forward<F>(f)); }
ND CEXP poly pre(u32 sz) CNE {
if (sz <= this->size()) return {this->begin(), this->begin() + sz};
poly _ = *this;
_.resize(sz);
return _;
}
CEXP void strip() NE {
auto [_, r] = rstrip_view(*this, [](cT_(val_t) x) NE { return x.val() == 0; });
if (data_t::erase(r, this->end()); data_t::empty()) data_t::push_back(val_t(0));
}
friend poly stripped(poly CR p) NE {
poly ret(rstrip_view(p, [](cT_(val_t) x) NE { return x.val() == 0; }));
if (ret.empty()) return {0};
return ret;
}
CEXP void reverse(u32 n = 0) NE { std::ranges::reverse(data_t::begin(), data_t::begin() + (n ? n : (u32)data_t::size())); }
CEXP void conv(poly CR r, u32 ans_size = 0) NE { conv_core.conv(*this, r, ans_size); }
CEXP poly operator-() CNE {
poly ret = *this;
ret.apply([](u32, auto& v) NE { v = -v; });
return ret;
}
friend CEXP poly operator+(poly p, val_t c) NE {
p[0] += c;
return p;
}
friend CEXP poly operator+(val_t c, poly CR p) NE { return p + c; }
friend CEXP poly operator-(poly p, val_t c) NE {
p[0] -= c;
return p;
}
friend CEXP poly operator-(val_t c, poly CR p) NE { return p - c; }
CEXP poly& operator*=(val_t c) NE {
apply([&c](u32, auto& v) NE { v *= c; });
return *this;
}
friend CEXP poly operator*(poly p, val_t c) NE { return p *= c; }
friend CEXP poly operator*(val_t c, poly p) NE { return p *= c; }
CEXP poly& operator+=(poly CR r) NE {
retif_((r.empty()) [[unlikely]], *this);
data_t::resize(max(data_t::size(), r.size())), apply_range(0, (u32)r.size(), [&r](u32 i, auto& v) NE { v += r[i]; });
return *this;
}
friend CEXP poly operator+(poly l, poly CR r) NE { return l += r; }
CEXP poly& operator-=(poly CR r) NE {
retif_((r.empty()) [[unlikely]], *this);
data_t::resize(max(data_t::size(), r.size()));
apply_range(0, (u32)r.size(), [&r](u32 i, auto& v) NE { v -= r[i]; });
return *this;
}
friend CEXP poly operator-(poly l, poly CR r) NE { return l -= r; }
CEXP poly& operator*=(poly CR r) NE {
if (r.empty()) {
data_t::resize(1), *data_t::data() = 0;
return *this;
}
conv(r);
return *this;
}
friend CEXP poly operator*(poly l, poly CR r) NE { return l *= r; }
CEXP auto operator<=>(poly CR r) CNE {
auto l_ = stripped(*this), r_ = stripped(r);
if (l_.size() != r_.size()) return l_.size() <=> r_.size();
return std::lexicographical_compare_three_way(l_.rbegin(), l_.rend(), r_.rbegin(), r_.rend());
}
CEXP bool operator==(poly CR r) CNE { return std::is_eq(*this <=> r); }
};
} // namespace poly_impl_
template <class T>
concept poly_c = std::same_as<T, poly_impl_::poly<TPN T::ccore_t>>;
} // namespace tifa_libs
#line 5 "src/fps/bostan_mori/lib.hpp"
namespace tifa_libs {
namespace bostan_mori_impl_ {
template <class ccore_t, class T>
vec<T> coeff_(ccore_t CR core, ccore_t CR core2, vec<T>& q, u64 n, u32 d) NE {
cu32 len = core.size();
vec<T> s(len * 2);
if (!n) {
vec<T> res(d);
res.back() = len * std::reduce(q.begin(), q.begin() + len, T(0)).inv();
return res;
}
ntt_doubling(core, q, len);
vec<T> a(len * 2);
flt_ (u32, i, len / 2, len) a[i * 2 + 1] = a[i * 2] = q[i * 2] * q[i * 2 + 1];
flt_ (u32, i, 0, len) a[i] = q[i * 2] * q[i * 2 + 1];
vec<T> w = coeff_(core, core2, a, n / 2, d);
s = vec<T>(len * 2);
for (u32 i = (n & 1) ^ 1, j = 0; j < d; ++j, i += 2) s[i] = w[j];
core2.dif(s);
flt_ (u32, i, 0, len * 2) s[i] *= q[i ^ 1];
core2.dit(s);
return vec<T>(begin(s) + d, begin(s) + d * 2);
}
} // namespace bostan_mori_impl_
// @return [x^k]p/q
template <poly_c poly_t>
CEXP auto bostan_mori(u64 n, poly_t CR p, poly_t CR q) NE {
if CEXP (assert(p.size() == q.size() - 1 && !p.is_zero()); poly_t::ccore_t::ct_cat != CCORE::NTT) {
auto p_ = p, q_ = q;
while (n) {
auto _ = q_;
for (u32 i = 1; i < _.size(); i += 2) _[i] = -_[i];
auto s = p_ * _, t = q_ * _;
for (u32 i = n & 1; i < s.size(); i += 2) p_[i / 2] = s[i];
for (u32 i = 0; i < t.size(); i += 2) q_[i / 2] = t[i];
n /= 2;
}
return p_[0];
} else {
auto& core = poly_t::conv_core;
auto core2 = core;
cu32 m = (u32)q.size();
core.bzr(m), core2.bzr(core.size() * 2);
auto q_ = q;
core.dif(q_), q_.resize(core2.size());
auto iq = bostan_mori_impl_::coeff_(core, core2, q_, n, m - 1);
TPN poly_t::val_t res = 0;
flt_ (u32, i, 0, iq.size()) res += p[i] * iq[iq.size() - 1 - i];
return res;
}
}
} // namespace tifa_libs
#line 2 "src/math/lrec/berlekamp_massey/lib.hpp"
#line 4 "src/math/lrec/berlekamp_massey/lib.hpp"
namespace tifa_libs {
template <class T>
CEXP vec<T> berlekamp_massey(vec<T> CR a) NE {
cu32 n = (u32)a.size();
vec<T> b{1}, c{1};
b.reserve(n + 1), c.reserve(n + 1);
T y = 1;
flt_ (u32, k, 1, n + 1) {
u32 l = (u32)c.size();
T x = 0;
flt_ (u32, i, 0, l) x += c[i] * a[k - l + i];
b.push_back(0);
u32 m = (u32)b.size();
if (x == 0) continue;
if (const T d_ = x / y; l < m) {
const auto _ = c;
c.insert(begin(c), m - l, 0);
flt_ (u32, i, 0, m) c[m - 1 - i] -= d_ * b[m - 1 - i];
b = _, y = x;
} else
flt_ (u32, i, 0, m) c[l - 1 - i] -= d_ * b[m - 1 - i];
}
reverse(c);
return c;
}
} // namespace tifa_libs
#line 5 "src/math/lrec/nth_term/lib.hpp"
namespace tifa_libs {
template <class poly, std::same_as<TPN poly::val_t> mint>
CEXP mint nth_term_lrec(u64 n, vec<mint> CR a, vec<mint> CR bm) NE {
if (n < a.size()) return a[n];
assert(!bm.empty() && bm[0] == 1);
poly q(bm);
q.strip();
return bostan_mori(n, (poly(a) * q).pre((u32)q.size() - 1), q);
}
template <class poly, std::same_as<TPN poly::val_t> mint>
CEXP mint nth_term_lrec(u64 n, vec<mint> CR a) NE {
if (n < a.size()) return a[n];
auto bm = berlekamp_massey(a);
return nth_term_lrec<poly, mint>(n, a, bm);
}
} // namespace tifa_libs